1 #ifndef QEMU_9P_H 2 #define QEMU_9P_H 3 4 #include <dirent.h> 5 #include <utime.h> 6 #include <sys/resource.h> 7 #include "fsdev/file-op-9p.h" 8 #include "fsdev/9p-iov-marshal.h" 9 #include "qemu/thread.h" 10 #include "qemu/coroutine.h" 11 #include "qemu/qht.h" 12 13 enum { 14 P9_TLERROR = 6, 15 P9_RLERROR, 16 P9_TSTATFS = 8, 17 P9_RSTATFS, 18 P9_TLOPEN = 12, 19 P9_RLOPEN, 20 P9_TLCREATE = 14, 21 P9_RLCREATE, 22 P9_TSYMLINK = 16, 23 P9_RSYMLINK, 24 P9_TMKNOD = 18, 25 P9_RMKNOD, 26 P9_TRENAME = 20, 27 P9_RRENAME, 28 P9_TREADLINK = 22, 29 P9_RREADLINK, 30 P9_TGETATTR = 24, 31 P9_RGETATTR, 32 P9_TSETATTR = 26, 33 P9_RSETATTR, 34 P9_TXATTRWALK = 30, 35 P9_RXATTRWALK, 36 P9_TXATTRCREATE = 32, 37 P9_RXATTRCREATE, 38 P9_TREADDIR = 40, 39 P9_RREADDIR, 40 P9_TFSYNC = 50, 41 P9_RFSYNC, 42 P9_TLOCK = 52, 43 P9_RLOCK, 44 P9_TGETLOCK = 54, 45 P9_RGETLOCK, 46 P9_TLINK = 70, 47 P9_RLINK, 48 P9_TMKDIR = 72, 49 P9_RMKDIR, 50 P9_TRENAMEAT = 74, 51 P9_RRENAMEAT, 52 P9_TUNLINKAT = 76, 53 P9_RUNLINKAT, 54 P9_TVERSION = 100, 55 P9_RVERSION, 56 P9_TAUTH = 102, 57 P9_RAUTH, 58 P9_TATTACH = 104, 59 P9_RATTACH, 60 P9_TERROR = 106, 61 P9_RERROR, 62 P9_TFLUSH = 108, 63 P9_RFLUSH, 64 P9_TWALK = 110, 65 P9_RWALK, 66 P9_TOPEN = 112, 67 P9_ROPEN, 68 P9_TCREATE = 114, 69 P9_RCREATE, 70 P9_TREAD = 116, 71 P9_RREAD, 72 P9_TWRITE = 118, 73 P9_RWRITE, 74 P9_TCLUNK = 120, 75 P9_RCLUNK, 76 P9_TREMOVE = 122, 77 P9_RREMOVE, 78 P9_TSTAT = 124, 79 P9_RSTAT, 80 P9_TWSTAT = 126, 81 P9_RWSTAT, 82 }; 83 84 85 /* qid.types */ 86 enum { 87 P9_QTDIR = 0x80, 88 P9_QTAPPEND = 0x40, 89 P9_QTEXCL = 0x20, 90 P9_QTMOUNT = 0x10, 91 P9_QTAUTH = 0x08, 92 P9_QTTMP = 0x04, 93 P9_QTSYMLINK = 0x02, 94 P9_QTLINK = 0x01, 95 P9_QTFILE = 0x00, 96 }; 97 98 typedef enum P9ProtoVersion { 99 V9FS_PROTO_2000U = 0x01, 100 V9FS_PROTO_2000L = 0x02, 101 } P9ProtoVersion; 102 103 /* 104 * Minimum message size supported by this 9pfs server. 105 * 106 * A client establishes a session by sending a Tversion request along with a 107 * 'msize' parameter which suggests the server a maximum message size ever to be 108 * used for communication (for both requests and replies) between client and 109 * server during that session. If client suggests a 'msize' smaller than this 110 * value then session is denied by server with an error response. 111 */ 112 #define P9_MIN_MSIZE 4096 113 114 #define P9_NOTAG UINT16_MAX 115 #define P9_NOFID UINT32_MAX 116 #define P9_MAXWELEM 16 117 118 #define FID_REFERENCED 0x1 119 #define FID_NON_RECLAIMABLE 0x2 120 static inline char *rpath(FsContext *ctx, const char *path) 121 { 122 return g_strdup_printf("%s/%s", ctx->fs_root, path); 123 } 124 125 /* 126 * ample room for Twrite/Rread header 127 * size[4] Tread/Twrite tag[2] fid[4] offset[8] count[4] 128 */ 129 #define P9_IOHDRSZ 24 130 131 typedef struct V9fsPDU V9fsPDU; 132 typedef struct V9fsState V9fsState; 133 typedef struct V9fsTransport V9fsTransport; 134 135 typedef struct { 136 uint32_t size_le; 137 uint8_t id; 138 uint16_t tag_le; 139 } QEMU_PACKED P9MsgHeader; 140 /* According to the specification, 9p messages start with a 7-byte header. 141 * Since most of the code uses this header size in literal form, we must be 142 * sure this is indeed the case. 143 */ 144 QEMU_BUILD_BUG_ON(sizeof(P9MsgHeader) != 7); 145 146 struct V9fsPDU { 147 uint32_t size; 148 uint16_t tag; 149 uint8_t id; 150 uint8_t cancelled; 151 CoQueue complete; 152 V9fsState *s; 153 QLIST_ENTRY(V9fsPDU) next; 154 uint32_t idx; 155 }; 156 157 158 /* FIXME 159 * 1) change user needs to set groups and stuff 160 */ 161 162 #define MAX_REQ 128 163 #define MAX_TAG_LEN 32 164 165 #define BUG_ON(cond) assert(!(cond)) 166 167 typedef struct V9fsFidState V9fsFidState; 168 169 enum { 170 P9_FID_NONE = 0, 171 P9_FID_FILE, 172 P9_FID_DIR, 173 P9_FID_XATTR, 174 }; 175 176 typedef struct V9fsConf 177 { 178 /* tag name for the device */ 179 char *tag; 180 char *fsdev_id; 181 } V9fsConf; 182 183 /* 9p2000.L xattr flags (matches Linux values) */ 184 #define P9_XATTR_CREATE 1 185 #define P9_XATTR_REPLACE 2 186 187 typedef struct V9fsXattr 188 { 189 uint64_t copied_len; 190 uint64_t len; 191 void *value; 192 V9fsString name; 193 int flags; 194 bool xattrwalk_fid; 195 } V9fsXattr; 196 197 typedef struct V9fsDir { 198 DIR *stream; 199 P9ProtoVersion proto_version; 200 /* readdir mutex type used for 9P2000.u protocol variant */ 201 CoMutex readdir_mutex_u; 202 /* readdir mutex type used for 9P2000.L protocol variant */ 203 QemuMutex readdir_mutex_L; 204 } V9fsDir; 205 206 static inline void coroutine_fn v9fs_readdir_lock(V9fsDir *dir) 207 { 208 if (dir->proto_version == V9FS_PROTO_2000U) { 209 qemu_co_mutex_lock(&dir->readdir_mutex_u); 210 } else { 211 qemu_mutex_lock(&dir->readdir_mutex_L); 212 } 213 } 214 215 static inline void coroutine_fn v9fs_readdir_unlock(V9fsDir *dir) 216 { 217 if (dir->proto_version == V9FS_PROTO_2000U) { 218 qemu_co_mutex_unlock(&dir->readdir_mutex_u); 219 } else { 220 qemu_mutex_unlock(&dir->readdir_mutex_L); 221 } 222 } 223 224 static inline void v9fs_readdir_init(P9ProtoVersion proto_version, V9fsDir *dir) 225 { 226 dir->proto_version = proto_version; 227 if (proto_version == V9FS_PROTO_2000U) { 228 qemu_co_mutex_init(&dir->readdir_mutex_u); 229 } else { 230 qemu_mutex_init(&dir->readdir_mutex_L); 231 } 232 } 233 234 /* 235 * Type for 9p fs drivers' (a.k.a. 9p backends) result of readdir requests, 236 * which is a chained list of directory entries. 237 */ 238 typedef struct V9fsDirEnt { 239 /* mandatory (must not be NULL) information for all readdir requests */ 240 struct dirent *dent; 241 /* 242 * optional (may be NULL): A full stat of each directory entry is just 243 * done if explicitly told to fs driver. 244 */ 245 struct stat *st; 246 /* 247 * instead of an array, directory entries are always returned as 248 * chained list, that's because the amount of entries retrieved by fs 249 * drivers is dependent on the individual entries' name (since response 250 * messages are size limited), so the final amount cannot be estimated 251 * before hand 252 */ 253 struct V9fsDirEnt *next; 254 } V9fsDirEnt; 255 256 /* 257 * Filled by fs driver on open and other 258 * calls. 259 */ 260 union V9fsFidOpenState { 261 int fd; 262 V9fsDir dir; 263 V9fsXattr xattr; 264 /* 265 * private pointer for fs drivers, that 266 * have its own internal representation of 267 * open files. 268 */ 269 void *private; 270 }; 271 272 struct V9fsFidState { 273 int fid_type; 274 int32_t fid; 275 V9fsPath path; 276 V9fsFidOpenState fs; 277 V9fsFidOpenState fs_reclaim; 278 int flags; 279 int open_flags; 280 uid_t uid; 281 int ref; 282 bool clunked; 283 QSLIST_ENTRY(V9fsFidState) reclaim_next; 284 }; 285 286 typedef enum AffixType_t { 287 AffixType_Prefix, 288 AffixType_Suffix, /* A.k.a. postfix. */ 289 } AffixType_t; 290 291 /* 292 * Unique affix of variable length. 293 * 294 * An affix is (currently) either a suffix or a prefix, which is either 295 * going to be prepended (prefix) or appended (suffix) with some other 296 * number for the goal to generate unique numbers. Accordingly the 297 * suffixes (or prefixes) we generate @b must all have the mathematical 298 * property of being suffix-free (or prefix-free in case of prefixes) 299 * so that no matter what number we concatenate the affix with, that we 300 * always reliably get unique numbers as result after concatenation. 301 */ 302 typedef struct VariLenAffix { 303 AffixType_t type; /* Whether this affix is a suffix or a prefix. */ 304 uint64_t value; /* Actual numerical value of this affix. */ 305 /* 306 * Length of the affix, that is how many (of the lowest) bits of ``value`` 307 * must be used for appending/prepending this affix to its final resulting, 308 * unique number. 309 */ 310 int bits; 311 } VariLenAffix; 312 313 /* See qid_inode_prefix_hash_bits(). */ 314 typedef struct { 315 dev_t dev; /* FS device on host. */ 316 /* 317 * How many (high) bits of the original inode number shall be used for 318 * hashing. 319 */ 320 int prefix_bits; 321 } QpdEntry; 322 323 /* QID path prefix entry, see stat_to_qid */ 324 typedef struct { 325 dev_t dev; 326 uint16_t ino_prefix; 327 uint32_t qp_affix_index; 328 VariLenAffix qp_affix; 329 } QppEntry; 330 331 /* QID path full entry, as above */ 332 typedef struct { 333 dev_t dev; 334 ino_t ino; 335 uint64_t path; 336 } QpfEntry; 337 338 struct V9fsState { 339 QLIST_HEAD(, V9fsPDU) free_list; 340 QLIST_HEAD(, V9fsPDU) active_list; 341 GHashTable *fids; 342 FileOperations *ops; 343 FsContext ctx; 344 char *tag; 345 P9ProtoVersion proto_version; 346 int32_t msize; 347 V9fsPDU pdus[MAX_REQ]; 348 const V9fsTransport *transport; 349 /* 350 * lock ensuring atomic path update 351 * on rename. 352 */ 353 CoRwlock rename_lock; 354 int32_t root_fid; 355 Error *migration_blocker; 356 V9fsConf fsconf; 357 struct stat root_st; 358 dev_t dev_id; 359 struct qht qpd_table; 360 struct qht qpp_table; 361 struct qht qpf_table; 362 uint64_t qp_ndevices; /* Amount of entries in qpd_table. */ 363 uint16_t qp_affix_next; 364 uint64_t qp_fullpath_next; 365 }; 366 367 /* 9p2000.L open flags */ 368 #define P9_DOTL_RDONLY 00000000 369 #define P9_DOTL_WRONLY 00000001 370 #define P9_DOTL_RDWR 00000002 371 #define P9_DOTL_NOACCESS 00000003 372 #define P9_DOTL_CREATE 00000100 373 #define P9_DOTL_EXCL 00000200 374 #define P9_DOTL_NOCTTY 00000400 375 #define P9_DOTL_TRUNC 00001000 376 #define P9_DOTL_APPEND 00002000 377 #define P9_DOTL_NONBLOCK 00004000 378 #define P9_DOTL_DSYNC 00010000 379 #define P9_DOTL_FASYNC 00020000 380 #define P9_DOTL_DIRECT 00040000 381 #define P9_DOTL_LARGEFILE 00100000 382 #define P9_DOTL_DIRECTORY 00200000 383 #define P9_DOTL_NOFOLLOW 00400000 384 #define P9_DOTL_NOATIME 01000000 385 #define P9_DOTL_CLOEXEC 02000000 386 #define P9_DOTL_SYNC 04000000 387 388 /* 9p2000.L at flags */ 389 #define P9_DOTL_AT_REMOVEDIR 0x200 390 391 /* 9P2000.L lock type */ 392 #define P9_LOCK_TYPE_RDLCK 0 393 #define P9_LOCK_TYPE_WRLCK 1 394 #define P9_LOCK_TYPE_UNLCK 2 395 396 #define P9_LOCK_SUCCESS 0 397 #define P9_LOCK_BLOCKED 1 398 #define P9_LOCK_ERROR 2 399 #define P9_LOCK_GRACE 3 400 401 #define P9_LOCK_FLAGS_BLOCK 1 402 #define P9_LOCK_FLAGS_RECLAIM 2 403 404 typedef struct V9fsFlock 405 { 406 uint8_t type; 407 uint32_t flags; 408 uint64_t start; /* absolute offset */ 409 uint64_t length; 410 uint32_t proc_id; 411 V9fsString client_id; 412 } V9fsFlock; 413 414 typedef struct V9fsGetlock 415 { 416 uint8_t type; 417 uint64_t start; /* absolute offset */ 418 uint64_t length; 419 uint32_t proc_id; 420 V9fsString client_id; 421 } V9fsGetlock; 422 423 extern int open_fd_hw; 424 extern int total_open_fd; 425 426 static inline void coroutine_fn 427 v9fs_path_write_lock(V9fsState *s) 428 { 429 if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) { 430 qemu_co_rwlock_wrlock(&s->rename_lock); 431 } 432 } 433 434 static inline void coroutine_fn 435 v9fs_path_read_lock(V9fsState *s) 436 { 437 if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) { 438 qemu_co_rwlock_rdlock(&s->rename_lock); 439 } 440 } 441 442 static inline void coroutine_fn 443 v9fs_path_unlock(V9fsState *s) 444 { 445 if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) { 446 qemu_co_rwlock_unlock(&s->rename_lock); 447 } 448 } 449 450 static inline uint8_t v9fs_request_cancelled(V9fsPDU *pdu) 451 { 452 return pdu->cancelled; 453 } 454 455 void coroutine_fn v9fs_reclaim_fd(V9fsPDU *pdu); 456 void v9fs_path_init(V9fsPath *path); 457 void v9fs_path_free(V9fsPath *path); 458 void v9fs_path_sprintf(V9fsPath *path, const char *fmt, ...); 459 void v9fs_path_copy(V9fsPath *dst, const V9fsPath *src); 460 size_t v9fs_readdir_response_size(V9fsString *name); 461 int v9fs_name_to_path(V9fsState *s, V9fsPath *dirpath, 462 const char *name, V9fsPath *path); 463 int v9fs_device_realize_common(V9fsState *s, const V9fsTransport *t, 464 Error **errp); 465 void v9fs_device_unrealize_common(V9fsState *s); 466 467 V9fsPDU *pdu_alloc(V9fsState *s); 468 void pdu_free(V9fsPDU *pdu); 469 void pdu_submit(V9fsPDU *pdu, P9MsgHeader *hdr); 470 void v9fs_reset(V9fsState *s); 471 472 struct V9fsTransport { 473 ssize_t (*pdu_vmarshal)(V9fsPDU *pdu, size_t offset, const char *fmt, 474 va_list ap); 475 ssize_t (*pdu_vunmarshal)(V9fsPDU *pdu, size_t offset, const char *fmt, 476 va_list ap); 477 void (*init_in_iov_from_pdu)(V9fsPDU *pdu, struct iovec **piov, 478 unsigned int *pniov, size_t size); 479 void (*init_out_iov_from_pdu)(V9fsPDU *pdu, struct iovec **piov, 480 unsigned int *pniov, size_t size); 481 void (*push_and_notify)(V9fsPDU *pdu); 482 }; 483 484 #endif 485