1 #include <linux/in.h>
2
3 #include "super.h"
4 #include "mds_client.h"
5 #include <linux/ceph/ceph_debug.h>
6
7 #include "ioctl.h"
8
9
10 /*
11 * ioctls
12 */
13
14 /*
15 * get and set the file layout
16 */
/*
 * Report the file's current layout to userspace.
 *
 * Refreshes the inode with ceph_do_getattr(CEPH_STAT_CAP_LAYOUT), then
 * fills a struct ceph_ioctl_layout from ci->i_layout and copies it to
 * @arg.
 *
 * Returns 0 on success, the error from ceph_do_getattr() if the refresh
 * fails, or -EFAULT if the result cannot be copied to @arg.
 */
static long ceph_ioctl_get_layout(struct file *file, void __user *arg)
{
	struct inode *inode = file->f_dentry->d_inode;
	struct ceph_inode_info *ci = ceph_inode(inode);
	struct ceph_ioctl_layout layout;
	int ret;

	ret = ceph_do_getattr(inode, CEPH_STAT_CAP_LAYOUT);
	if (ret)
		return ret;

	layout.stripe_unit = ceph_file_layout_su(ci->i_layout);
	layout.stripe_count = ceph_file_layout_stripe_count(ci->i_layout);
	layout.object_size = ceph_file_layout_object_size(ci->i_layout);
	layout.data_pool = le32_to_cpu(ci->i_layout.fl_pg_pool);
	/* the on-wire value is unsigned; reinterpret it as signed */
	layout.preferred_osd = (s32)le32_to_cpu(ci->i_layout.fl_pg_preferred);

	if (copy_to_user(arg, &layout, sizeof(layout)))
		return -EFAULT;

	return 0;
}
37
/*
 * Set the layout of the file behind @file.
 *
 * Reads a struct ceph_ioctl_layout from @arg, validates the striping
 * parameters and (when data_pool > 0) checks the pool against the data
 * pools listed in the current mdsmap, then issues a
 * CEPH_MDS_OP_SETLAYOUT request.
 *
 * Returns 0 on success, -EFAULT if @arg cannot be read, -EINVAL if the
 * layout fails validation, or the error from creating or performing the
 * MDS request.
 */
static long ceph_ioctl_set_layout(struct file *file, void __user *arg)
{
	struct inode *inode = file->f_dentry->d_inode;
	/*
	 * NOTE(review): d_parent is dereferenced here without taking a
	 * reference or lock - confirm this is safe against a concurrent
	 * rename.
	 */
	struct inode *parent_inode = file->f_dentry->d_parent->d_inode;
	struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc;
	struct ceph_mds_request *req;
	struct ceph_ioctl_layout l;
	int err, i;

	/* copy and validate */
	if (copy_from_user(&l, arg, sizeof(l)))
		return -EFAULT;

	/*
	 * The modulo below operates on the values truncated to unsigned,
	 * so the zero test on the divisor has to use the truncated value
	 * as well.  Testing the untruncated field would let a non-zero,
	 * page-aligned stripe_unit whose low bits are all zero (if the
	 * field is wider than unsigned) reach the modulo as a zero divisor.
	 */
	if ((l.object_size & ~PAGE_MASK) ||
	    (l.stripe_unit & ~PAGE_MASK) ||
	    (unsigned)l.stripe_unit == 0 ||
	    (l.object_size &&
	     (unsigned)l.object_size % (unsigned)l.stripe_unit))
		return -EINVAL;

	/* make sure it's a valid data pool */
	if (l.data_pool > 0) {
		mutex_lock(&mdsc->mutex);
		err = -EINVAL;
		for (i = 0; i < mdsc->mdsmap->m_num_data_pg_pools; i++)
			if (mdsc->mdsmap->m_data_pg_pools[i] == l.data_pool) {
				err = 0;
				break;
			}
		mutex_unlock(&mdsc->mutex);
		if (err)
			return err;
	}

	req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETLAYOUT,
				       USE_AUTH_MDS);
	if (IS_ERR(req))
		return PTR_ERR(req);
	req->r_inode = igrab(inode);
	req->r_inode_drop = CEPH_CAP_FILE_SHARED | CEPH_CAP_FILE_EXCL;

	/* every layout field goes on the wire as a little-endian 32-bit value */
	req->r_args.setlayout.layout.fl_stripe_unit =
		cpu_to_le32(l.stripe_unit);
	req->r_args.setlayout.layout.fl_stripe_count =
		cpu_to_le32(l.stripe_count);
	req->r_args.setlayout.layout.fl_object_size =
		cpu_to_le32(l.object_size);
	req->r_args.setlayout.layout.fl_pg_pool = cpu_to_le32(l.data_pool);
	req->r_args.setlayout.layout.fl_pg_preferred =
		cpu_to_le32(l.preferred_osd);

	err = ceph_mdsc_do_request(mdsc, parent_inode, req);
	ceph_mdsc_put_request(req);
	return err;
}
93
94 /*
95 * Set a layout policy on a directory inode. All items in the tree
96 * rooted at this inode will inherit this layout on creation,
97 * (It doesn't apply retroactively )
98 * unless a subdirectory has its own layout policy.
99 */
ceph_ioctl_set_layout_policy(struct file * file,void __user * arg)100 static long ceph_ioctl_set_layout_policy (struct file *file, void __user *arg)
101 {
102 struct inode *inode = file->f_dentry->d_inode;
103 struct ceph_mds_request *req;
104 struct ceph_ioctl_layout l;
105 int err, i;
106 struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc;
107
108 /* copy and validate */
109 if (copy_from_user(&l, arg, sizeof(l)))
110 return -EFAULT;
111
112 if ((l.object_size & ~PAGE_MASK) ||
113 (l.stripe_unit & ~PAGE_MASK) ||
114 !l.stripe_unit ||
115 (l.object_size &&
116 (unsigned)l.object_size % (unsigned)l.stripe_unit))
117 return -EINVAL;
118
119 /* make sure it's a valid data pool */
120 if (l.data_pool > 0) {
121 mutex_lock(&mdsc->mutex);
122 err = -EINVAL;
123 for (i = 0; i < mdsc->mdsmap->m_num_data_pg_pools; i++)
124 if (mdsc->mdsmap->m_data_pg_pools[i] == l.data_pool) {
125 err = 0;
126 break;
127 }
128 mutex_unlock(&mdsc->mutex);
129 if (err)
130 return err;
131 }
132
133 req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETDIRLAYOUT,
134 USE_AUTH_MDS);
135
136 if (IS_ERR(req))
137 return PTR_ERR(req);
138 req->r_inode = igrab(inode);
139
140 req->r_args.setlayout.layout.fl_stripe_unit =
141 cpu_to_le32(l.stripe_unit);
142 req->r_args.setlayout.layout.fl_stripe_count =
143 cpu_to_le32(l.stripe_count);
144 req->r_args.setlayout.layout.fl_object_size =
145 cpu_to_le32(l.object_size);
146 req->r_args.setlayout.layout.fl_pg_pool =
147 cpu_to_le32(l.data_pool);
148 req->r_args.setlayout.layout.fl_pg_preferred =
149 cpu_to_le32(l.preferred_osd);
150
151 err = ceph_mdsc_do_request(mdsc, inode, req);
152 ceph_mdsc_put_request(req);
153 return err;
154 }
155
156 /*
157 * Return object name, size/offset information, and location (OSD
158 * number, network address) for a given file offset.
159 */
ceph_ioctl_get_dataloc(struct file * file,void __user * arg)160 static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg)
161 {
162 struct ceph_ioctl_dataloc dl;
163 struct inode *inode = file->f_dentry->d_inode;
164 struct ceph_inode_info *ci = ceph_inode(inode);
165 struct ceph_osd_client *osdc =
166 &ceph_sb_to_client(inode->i_sb)->client->osdc;
167 u64 len = 1, olen;
168 u64 tmp;
169 struct ceph_object_layout ol;
170 struct ceph_pg pgid;
171
172 /* copy and validate */
173 if (copy_from_user(&dl, arg, sizeof(dl)))
174 return -EFAULT;
175
176 down_read(&osdc->map_sem);
177 ceph_calc_file_object_mapping(&ci->i_layout, dl.file_offset, &len,
178 &dl.object_no, &dl.object_offset, &olen);
179 dl.file_offset -= dl.object_offset;
180 dl.object_size = ceph_file_layout_object_size(ci->i_layout);
181 dl.block_size = ceph_file_layout_su(ci->i_layout);
182
183 /* block_offset = object_offset % block_size */
184 tmp = dl.object_offset;
185 dl.block_offset = do_div(tmp, dl.block_size);
186
187 snprintf(dl.object_name, sizeof(dl.object_name), "%llx.%08llx",
188 ceph_ino(inode), dl.object_no);
189 ceph_calc_object_layout(&ol, dl.object_name, &ci->i_layout,
190 osdc->osdmap);
191
192 pgid = ol.ol_pgid;
193 dl.osd = ceph_calc_pg_primary(osdc->osdmap, pgid);
194 if (dl.osd >= 0) {
195 struct ceph_entity_addr *a =
196 ceph_osd_addr(osdc->osdmap, dl.osd);
197 if (a)
198 memcpy(&dl.osd_addr, &a->in_addr, sizeof(dl.osd_addr));
199 } else {
200 memset(&dl.osd_addr, 0, sizeof(dl.osd_addr));
201 }
202 up_read(&osdc->map_sem);
203
204 /* send result back to user */
205 if (copy_to_user(arg, &dl, sizeof(dl)))
206 return -EFAULT;
207
208 return 0;
209 }
210
ceph_ioctl_lazyio(struct file * file)211 static long ceph_ioctl_lazyio(struct file *file)
212 {
213 struct ceph_file_info *fi = file->private_data;
214 struct inode *inode = file->f_dentry->d_inode;
215 struct ceph_inode_info *ci = ceph_inode(inode);
216
217 if ((fi->fmode & CEPH_FILE_MODE_LAZY) == 0) {
218 spin_lock(&inode->i_lock);
219 ci->i_nr_by_mode[fi->fmode]--;
220 fi->fmode |= CEPH_FILE_MODE_LAZY;
221 ci->i_nr_by_mode[fi->fmode]++;
222 spin_unlock(&inode->i_lock);
223 dout("ioctl_layzio: file %p marked lazy\n", file);
224
225 ceph_check_caps(ci, 0, NULL);
226 } else {
227 dout("ioctl_layzio: file %p already lazy\n", file);
228 }
229 return 0;
230 }
231
ceph_ioctl(struct file * file,unsigned int cmd,unsigned long arg)232 long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
233 {
234 dout("ioctl file %p cmd %u arg %lu\n", file, cmd, arg);
235 switch (cmd) {
236 case CEPH_IOC_GET_LAYOUT:
237 return ceph_ioctl_get_layout(file, (void __user *)arg);
238
239 case CEPH_IOC_SET_LAYOUT:
240 return ceph_ioctl_set_layout(file, (void __user *)arg);
241
242 case CEPH_IOC_SET_LAYOUT_POLICY:
243 return ceph_ioctl_set_layout_policy(file, (void __user *)arg);
244
245 case CEPH_IOC_GET_DATALOC:
246 return ceph_ioctl_get_dataloc(file, (void __user *)arg);
247
248 case CEPH_IOC_LAZYIO:
249 return ceph_ioctl_lazyio(file);
250 }
251
252 return -ENOTTY;
253 }
254