xref: /openbmc/qemu/hw/9pfs/9p.h (revision 95ee23ed2dd3f534a6b7038dbc1fb33a788d80f9)
1 #ifndef QEMU_9P_H
2 #define QEMU_9P_H
3 
4 #include <dirent.h>
5 #include <utime.h>
6 #include <sys/resource.h>
7 #include "fsdev/file-op-9p.h"
8 #include "fsdev/9p-iov-marshal.h"
9 #include "qemu/thread.h"
10 #include "qemu/coroutine.h"
11 #include "qemu/qht.h"
12 
13 enum {
14     P9_TLERROR = 6,
15     P9_RLERROR,
16     P9_TSTATFS = 8,
17     P9_RSTATFS,
18     P9_TLOPEN = 12,
19     P9_RLOPEN,
20     P9_TLCREATE = 14,
21     P9_RLCREATE,
22     P9_TSYMLINK = 16,
23     P9_RSYMLINK,
24     P9_TMKNOD = 18,
25     P9_RMKNOD,
26     P9_TRENAME = 20,
27     P9_RRENAME,
28     P9_TREADLINK = 22,
29     P9_RREADLINK,
30     P9_TGETATTR = 24,
31     P9_RGETATTR,
32     P9_TSETATTR = 26,
33     P9_RSETATTR,
34     P9_TXATTRWALK = 30,
35     P9_RXATTRWALK,
36     P9_TXATTRCREATE = 32,
37     P9_RXATTRCREATE,
38     P9_TREADDIR = 40,
39     P9_RREADDIR,
40     P9_TFSYNC = 50,
41     P9_RFSYNC,
42     P9_TLOCK = 52,
43     P9_RLOCK,
44     P9_TGETLOCK = 54,
45     P9_RGETLOCK,
46     P9_TLINK = 70,
47     P9_RLINK,
48     P9_TMKDIR = 72,
49     P9_RMKDIR,
50     P9_TRENAMEAT = 74,
51     P9_RRENAMEAT,
52     P9_TUNLINKAT = 76,
53     P9_RUNLINKAT,
54     P9_TVERSION = 100,
55     P9_RVERSION,
56     P9_TAUTH = 102,
57     P9_RAUTH,
58     P9_TATTACH = 104,
59     P9_RATTACH,
60     P9_TERROR = 106,
61     P9_RERROR,
62     P9_TFLUSH = 108,
63     P9_RFLUSH,
64     P9_TWALK = 110,
65     P9_RWALK,
66     P9_TOPEN = 112,
67     P9_ROPEN,
68     P9_TCREATE = 114,
69     P9_RCREATE,
70     P9_TREAD = 116,
71     P9_RREAD,
72     P9_TWRITE = 118,
73     P9_RWRITE,
74     P9_TCLUNK = 120,
75     P9_RCLUNK,
76     P9_TREMOVE = 122,
77     P9_RREMOVE,
78     P9_TSTAT = 124,
79     P9_RSTAT,
80     P9_TWSTAT = 126,
81     P9_RWSTAT,
82 };
83 
84 
85 /* qid.types */
86 enum {
87     P9_QTDIR = 0x80,
88     P9_QTAPPEND = 0x40,
89     P9_QTEXCL = 0x20,
90     P9_QTMOUNT = 0x10,
91     P9_QTAUTH = 0x08,
92     P9_QTTMP = 0x04,
93     P9_QTSYMLINK = 0x02,
94     P9_QTLINK = 0x01,
95     P9_QTFILE = 0x00,
96 };
97 
98 typedef enum P9ProtoVersion {
99     V9FS_PROTO_2000U = 0x01,
100     V9FS_PROTO_2000L = 0x02,
101 } P9ProtoVersion;
102 
103 /*
104  * Minimum message size supported by this 9pfs server.
105  *
106  * A client establishes a session by sending a Tversion request along with a
107  * 'msize' parameter which suggests the server a maximum message size ever to be
108  * used for communication (for both requests and replies) between client and
109  * server during that session. If client suggests a 'msize' smaller than this
110  * value then session is denied by server with an error response.
111  */
112 #define P9_MIN_MSIZE    4096
113 
114 #define P9_NOTAG    UINT16_MAX
115 #define P9_NOFID    UINT32_MAX
116 #define P9_MAXWELEM 16
117 
118 #define FID_REFERENCED          0x1
119 #define FID_NON_RECLAIMABLE     0x2
rpath(FsContext * ctx,const char * path)120 static inline char *rpath(FsContext *ctx, const char *path)
121 {
122     return g_strdup_printf("%s/%s", ctx->fs_root, path);
123 }
124 
125 /*
126  * ample room for Twrite/Rread header
127  * size[4] Tread/Twrite tag[2] fid[4] offset[8] count[4]
128  */
129 #define P9_IOHDRSZ 24
130 
131 typedef struct V9fsPDU V9fsPDU;
132 typedef struct V9fsState V9fsState;
133 typedef struct V9fsTransport V9fsTransport;
134 
135 typedef struct {
136     uint32_t size_le;
137     uint8_t id;
138     uint16_t tag_le;
139 } QEMU_PACKED P9MsgHeader;
140 /* According to the specification, 9p messages start with a 7-byte header.
141  * Since most of the code uses this header size in literal form, we must be
142  * sure this is indeed the case.
143  */
144 QEMU_BUILD_BUG_ON(sizeof(P9MsgHeader) != 7);
145 
146 struct V9fsPDU {
147     uint32_t size;
148     uint16_t tag;
149     uint8_t id;
150     uint8_t cancelled;
151     CoQueue complete;
152     V9fsState *s;
153     QLIST_ENTRY(V9fsPDU) next;
154     uint32_t idx;
155 };
156 
157 
158 /* FIXME
159  * 1) change user needs to set groups and stuff
160  */
161 
162 #define MAX_REQ         128
163 #define MAX_TAG_LEN     32
164 
165 #define BUG_ON(cond) assert(!(cond))
166 
167 typedef struct V9fsFidState V9fsFidState;
168 
169 enum {
170     P9_FID_NONE = 0,
171     P9_FID_FILE,
172     P9_FID_DIR,
173     P9_FID_XATTR,
174 };
175 
176 typedef struct V9fsConf
177 {
178     /* tag name for the device */
179     char *tag;
180     char *fsdev_id;
181 } V9fsConf;
182 
183 /* 9p2000.L xattr flags (matches Linux values) */
184 #define P9_XATTR_CREATE 1
185 #define P9_XATTR_REPLACE 2
186 
187 typedef struct V9fsXattr
188 {
189     uint64_t copied_len;
190     uint64_t len;
191     void *value;
192     V9fsString name;
193     int flags;
194     bool xattrwalk_fid;
195 } V9fsXattr;
196 
197 typedef struct V9fsDir {
198     DIR *stream;
199     P9ProtoVersion proto_version;
200     /* readdir mutex type used for 9P2000.u protocol variant */
201     CoMutex readdir_mutex_u;
202     /* readdir mutex type used for 9P2000.L protocol variant */
203     QemuMutex readdir_mutex_L;
204 } V9fsDir;
205 
v9fs_readdir_lock(V9fsDir * dir)206 static inline void coroutine_fn v9fs_readdir_lock(V9fsDir *dir)
207 {
208     if (dir->proto_version == V9FS_PROTO_2000U) {
209         qemu_co_mutex_lock(&dir->readdir_mutex_u);
210     } else {
211         qemu_mutex_lock(&dir->readdir_mutex_L);
212     }
213 }
214 
v9fs_readdir_unlock(V9fsDir * dir)215 static inline void coroutine_fn v9fs_readdir_unlock(V9fsDir *dir)
216 {
217     if (dir->proto_version == V9FS_PROTO_2000U) {
218         qemu_co_mutex_unlock(&dir->readdir_mutex_u);
219     } else {
220         qemu_mutex_unlock(&dir->readdir_mutex_L);
221     }
222 }
223 
v9fs_readdir_init(P9ProtoVersion proto_version,V9fsDir * dir)224 static inline void v9fs_readdir_init(P9ProtoVersion proto_version, V9fsDir *dir)
225 {
226     dir->proto_version = proto_version;
227     if (proto_version == V9FS_PROTO_2000U) {
228         qemu_co_mutex_init(&dir->readdir_mutex_u);
229     } else {
230         qemu_mutex_init(&dir->readdir_mutex_L);
231     }
232 }
233 
234 /*
235  * Type for 9p fs drivers' (a.k.a. 9p backends) result of readdir requests,
236  * which is a chained list of directory entries.
237  */
238 typedef struct V9fsDirEnt {
239     /* mandatory (must not be NULL) information for all readdir requests */
240     struct dirent *dent;
241     /*
242      * optional (may be NULL): A full stat of each directory entry is just
243      * done if explicitly told to fs driver.
244      */
245     struct stat *st;
246     /*
247      * instead of an array, directory entries are always returned as
248      * chained list, that's because the amount of entries retrieved by fs
249      * drivers is dependent on the individual entries' name (since response
250      * messages are size limited), so the final amount cannot be estimated
251      * before hand
252      */
253     struct V9fsDirEnt *next;
254 } V9fsDirEnt;
255 
256 /*
257  * Filled by fs driver on open and other
258  * calls.
259  */
260 union V9fsFidOpenState {
261     int fd;
262     V9fsDir dir;
263     V9fsXattr xattr;
264     /*
265      * private pointer for fs drivers, that
266      * have its own internal representation of
267      * open files.
268      */
269     void *private;
270 };
271 
272 struct V9fsFidState {
273     int fid_type;
274     int32_t fid;
275     V9fsPath path;
276     V9fsFidOpenState fs;
277     V9fsFidOpenState fs_reclaim;
278     int flags;
279     int open_flags;
280     uid_t uid;
281     int ref;
282     bool clunked;
283     QSLIST_ENTRY(V9fsFidState) reclaim_next;
284 };
285 
286 typedef enum AffixType_t {
287     AffixType_Prefix,
288     AffixType_Suffix, /* A.k.a. postfix. */
289 } AffixType_t;
290 
291 /*
292  * Unique affix of variable length.
293  *
294  * An affix is (currently) either a suffix or a prefix, which is either
295  * going to be prepended (prefix) or appended (suffix) with some other
296  * number for the goal to generate unique numbers. Accordingly the
297  * suffixes (or prefixes) we generate @b must all have the mathematical
298  * property of being suffix-free (or prefix-free in case of prefixes)
299  * so that no matter what number we concatenate the affix with, that we
300  * always reliably get unique numbers as result after concatenation.
301  */
302 typedef struct VariLenAffix {
303     AffixType_t type; /* Whether this affix is a suffix or a prefix. */
304     uint64_t value; /* Actual numerical value of this affix. */
305     /*
306      * Length of the affix, that is how many (of the lowest) bits of ``value``
307      * must be used for appending/prepending this affix to its final resulting,
308      * unique number.
309      */
310     int bits;
311 } VariLenAffix;
312 
313 /* See qid_inode_prefix_hash_bits(). */
314 typedef struct {
315     dev_t dev; /* FS device on host. */
316     /*
317      * How many (high) bits of the original inode number shall be used for
318      * hashing.
319      */
320     int prefix_bits;
321 } QpdEntry;
322 
323 /* QID path prefix entry, see stat_to_qid */
324 typedef struct {
325     dev_t dev;
326     uint16_t ino_prefix;
327     uint32_t qp_affix_index;
328     VariLenAffix qp_affix;
329 } QppEntry;
330 
331 /* QID path full entry, as above */
332 typedef struct {
333     dev_t dev;
334     ino_t ino;
335     uint64_t path;
336 } QpfEntry;
337 
338 struct V9fsState {
339     QLIST_HEAD(, V9fsPDU) free_list;
340     QLIST_HEAD(, V9fsPDU) active_list;
341     GHashTable *fids;
342     FileOperations *ops;
343     FsContext ctx;
344     char *tag;
345     P9ProtoVersion proto_version;
346     int32_t msize;
347     V9fsPDU pdus[MAX_REQ];
348     const V9fsTransport *transport;
349     /*
350      * lock ensuring atomic path update
351      * on rename.
352      */
353     CoRwlock rename_lock;
354     int32_t root_fid;
355     Error *migration_blocker;
356     V9fsConf fsconf;
357     struct stat root_st;
358     dev_t dev_id;
359     struct qht qpd_table;
360     struct qht qpp_table;
361     struct qht qpf_table;
362     uint64_t qp_ndevices; /* Amount of entries in qpd_table. */
363     uint16_t qp_affix_next;
364     uint64_t qp_fullpath_next;
365 };
366 
367 /* 9p2000.L open flags */
368 #define P9_DOTL_RDONLY        00000000
369 #define P9_DOTL_WRONLY        00000001
370 #define P9_DOTL_RDWR          00000002
371 #define P9_DOTL_NOACCESS      00000003
372 #define P9_DOTL_CREATE        00000100
373 #define P9_DOTL_EXCL          00000200
374 #define P9_DOTL_NOCTTY        00000400
375 #define P9_DOTL_TRUNC         00001000
376 #define P9_DOTL_APPEND        00002000
377 #define P9_DOTL_NONBLOCK      00004000
378 #define P9_DOTL_DSYNC         00010000
379 #define P9_DOTL_FASYNC        00020000
380 #define P9_DOTL_DIRECT        00040000
381 #define P9_DOTL_LARGEFILE     00100000
382 #define P9_DOTL_DIRECTORY     00200000
383 #define P9_DOTL_NOFOLLOW      00400000
384 #define P9_DOTL_NOATIME       01000000
385 #define P9_DOTL_CLOEXEC       02000000
386 #define P9_DOTL_SYNC          04000000
387 
388 /* 9p2000.L at flags */
389 #define P9_DOTL_AT_REMOVEDIR         0x200
390 
391 /* 9P2000.L lock type */
392 #define P9_LOCK_TYPE_RDLCK 0
393 #define P9_LOCK_TYPE_WRLCK 1
394 #define P9_LOCK_TYPE_UNLCK 2
395 
396 #define P9_LOCK_SUCCESS 0
397 #define P9_LOCK_BLOCKED 1
398 #define P9_LOCK_ERROR 2
399 #define P9_LOCK_GRACE 3
400 
401 #define P9_LOCK_FLAGS_BLOCK 1
402 #define P9_LOCK_FLAGS_RECLAIM 2
403 
404 typedef struct V9fsFlock
405 {
406     uint8_t type;
407     uint32_t flags;
408     uint64_t start; /* absolute offset */
409     uint64_t length;
410     uint32_t proc_id;
411     V9fsString client_id;
412 } V9fsFlock;
413 
414 typedef struct V9fsGetlock
415 {
416     uint8_t type;
417     uint64_t start; /* absolute offset */
418     uint64_t length;
419     uint32_t proc_id;
420     V9fsString client_id;
421 } V9fsGetlock;
422 
423 extern int open_fd_hw;
424 extern int total_open_fd;
425 
426 static inline void coroutine_fn
v9fs_path_write_lock(V9fsState * s)427 v9fs_path_write_lock(V9fsState *s)
428 {
429     if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) {
430         qemu_co_rwlock_wrlock(&s->rename_lock);
431     }
432 }
433 
434 static inline void coroutine_fn
v9fs_path_read_lock(V9fsState * s)435 v9fs_path_read_lock(V9fsState *s)
436 {
437     if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) {
438         qemu_co_rwlock_rdlock(&s->rename_lock);
439     }
440 }
441 
442 static inline void coroutine_fn
v9fs_path_unlock(V9fsState * s)443 v9fs_path_unlock(V9fsState *s)
444 {
445     if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) {
446         qemu_co_rwlock_unlock(&s->rename_lock);
447     }
448 }
449 
v9fs_request_cancelled(V9fsPDU * pdu)450 static inline uint8_t v9fs_request_cancelled(V9fsPDU *pdu)
451 {
452     return pdu->cancelled;
453 }
454 
455 void coroutine_fn v9fs_reclaim_fd(V9fsPDU *pdu);
456 void v9fs_path_init(V9fsPath *path);
457 void v9fs_path_free(V9fsPath *path);
458 void v9fs_path_sprintf(V9fsPath *path, const char *fmt, ...);
459 void v9fs_path_copy(V9fsPath *dst, const V9fsPath *src);
460 size_t v9fs_readdir_response_size(V9fsString *name);
461 int v9fs_name_to_path(V9fsState *s, V9fsPath *dirpath,
462                       const char *name, V9fsPath *path);
463 int v9fs_device_realize_common(V9fsState *s, const V9fsTransport *t,
464                                Error **errp);
465 void v9fs_device_unrealize_common(V9fsState *s);
466 
467 V9fsPDU *pdu_alloc(V9fsState *s);
468 void pdu_free(V9fsPDU *pdu);
469 void pdu_submit(V9fsPDU *pdu, P9MsgHeader *hdr);
470 void v9fs_reset(V9fsState *s);
471 
472 struct V9fsTransport {
473     ssize_t     (*pdu_vmarshal)(V9fsPDU *pdu, size_t offset, const char *fmt,
474                                 va_list ap);
475     ssize_t     (*pdu_vunmarshal)(V9fsPDU *pdu, size_t offset, const char *fmt,
476                                   va_list ap);
477     void        (*init_in_iov_from_pdu)(V9fsPDU *pdu, struct iovec **piov,
478                                         unsigned int *pniov, size_t size);
479     void        (*init_out_iov_from_pdu)(V9fsPDU *pdu, struct iovec **piov,
480                                          unsigned int *pniov, size_t size);
481     void        (*push_and_notify)(V9fsPDU *pdu);
482 };
483 
484 #endif
485