1 #ifndef QEMU_9P_H 2 #define QEMU_9P_H 3 4 #include <dirent.h> 5 #include <utime.h> 6 #include <sys/resource.h> 7 #include "fsdev/file-op-9p.h" 8 #include "fsdev/9p-iov-marshal.h" 9 #include "qemu/thread.h" 10 #include "qemu/coroutine.h" 11 #include "qemu/qht.h" 12 13 enum { 14 P9_TLERROR = 6, 15 P9_RLERROR, 16 P9_TSTATFS = 8, 17 P9_RSTATFS, 18 P9_TLOPEN = 12, 19 P9_RLOPEN, 20 P9_TLCREATE = 14, 21 P9_RLCREATE, 22 P9_TSYMLINK = 16, 23 P9_RSYMLINK, 24 P9_TMKNOD = 18, 25 P9_RMKNOD, 26 P9_TRENAME = 20, 27 P9_RRENAME, 28 P9_TREADLINK = 22, 29 P9_RREADLINK, 30 P9_TGETATTR = 24, 31 P9_RGETATTR, 32 P9_TSETATTR = 26, 33 P9_RSETATTR, 34 P9_TXATTRWALK = 30, 35 P9_RXATTRWALK, 36 P9_TXATTRCREATE = 32, 37 P9_RXATTRCREATE, 38 P9_TREADDIR = 40, 39 P9_RREADDIR, 40 P9_TFSYNC = 50, 41 P9_RFSYNC, 42 P9_TLOCK = 52, 43 P9_RLOCK, 44 P9_TGETLOCK = 54, 45 P9_RGETLOCK, 46 P9_TLINK = 70, 47 P9_RLINK, 48 P9_TMKDIR = 72, 49 P9_RMKDIR, 50 P9_TRENAMEAT = 74, 51 P9_RRENAMEAT, 52 P9_TUNLINKAT = 76, 53 P9_RUNLINKAT, 54 P9_TVERSION = 100, 55 P9_RVERSION, 56 P9_TAUTH = 102, 57 P9_RAUTH, 58 P9_TATTACH = 104, 59 P9_RATTACH, 60 P9_TERROR = 106, 61 P9_RERROR, 62 P9_TFLUSH = 108, 63 P9_RFLUSH, 64 P9_TWALK = 110, 65 P9_RWALK, 66 P9_TOPEN = 112, 67 P9_ROPEN, 68 P9_TCREATE = 114, 69 P9_RCREATE, 70 P9_TREAD = 116, 71 P9_RREAD, 72 P9_TWRITE = 118, 73 P9_RWRITE, 74 P9_TCLUNK = 120, 75 P9_RCLUNK, 76 P9_TREMOVE = 122, 77 P9_RREMOVE, 78 P9_TSTAT = 124, 79 P9_RSTAT, 80 P9_TWSTAT = 126, 81 P9_RWSTAT, 82 }; 83 84 85 /* qid.types */ 86 enum { 87 P9_QTDIR = 0x80, 88 P9_QTAPPEND = 0x40, 89 P9_QTEXCL = 0x20, 90 P9_QTMOUNT = 0x10, 91 P9_QTAUTH = 0x08, 92 P9_QTTMP = 0x04, 93 P9_QTSYMLINK = 0x02, 94 P9_QTLINK = 0x01, 95 P9_QTFILE = 0x00, 96 }; 97 98 typedef enum P9ProtoVersion { 99 V9FS_PROTO_2000U = 0x01, 100 V9FS_PROTO_2000L = 0x02, 101 } P9ProtoVersion; 102 103 /* 104 * Minimum message size supported by this 9pfs server. 105 * 106 * A client establishes a session by sending a Tversion request along with a 107 * 'msize' parameter which suggests the server a maximum message size ever to be 108 * used for communication (for both requests and replies) between client and 109 * server during that session. If client suggests a 'msize' smaller than this 110 * value then session is denied by server with an error response. 111 */ 112 #define P9_MIN_MSIZE 4096 113 114 #define P9_NOTAG UINT16_MAX 115 #define P9_NOFID UINT32_MAX 116 #define P9_MAXWELEM 16 117 118 #define FID_REFERENCED 0x1 119 #define FID_NON_RECLAIMABLE 0x2 120 static inline char *rpath(FsContext *ctx, const char *path) 121 { 122 return g_strdup_printf("%s/%s", ctx->fs_root, path); 123 } 124 125 /* 126 * ample room for Twrite/Rread header 127 * size[4] Tread/Twrite tag[2] fid[4] offset[8] count[4] 128 */ 129 #define P9_IOHDRSZ 24 130 131 typedef struct V9fsPDU V9fsPDU; 132 typedef struct V9fsState V9fsState; 133 typedef struct V9fsTransport V9fsTransport; 134 135 typedef struct { 136 uint32_t size_le; 137 uint8_t id; 138 uint16_t tag_le; 139 } QEMU_PACKED P9MsgHeader; 140 /* According to the specification, 9p messages start with a 7-byte header. 141 * Since most of the code uses this header size in literal form, we must be 142 * sure this is indeed the case. 143 */ 144 QEMU_BUILD_BUG_ON(sizeof(P9MsgHeader) != 7); 145 146 struct V9fsPDU { 147 uint32_t size; 148 uint16_t tag; 149 uint8_t id; 150 uint8_t cancelled; 151 CoQueue complete; 152 V9fsState *s; 153 QLIST_ENTRY(V9fsPDU) next; 154 uint32_t idx; 155 }; 156 157 158 /* FIXME 159 * 1) change user needs to set groups and stuff 160 */ 161 162 #define MAX_REQ 128 163 #define MAX_TAG_LEN 32 164 165 #define BUG_ON(cond) assert(!(cond)) 166 167 typedef struct V9fsFidState V9fsFidState; 168 169 enum { 170 P9_FID_NONE = 0, 171 P9_FID_FILE, 172 P9_FID_DIR, 173 P9_FID_XATTR, 174 }; 175 176 typedef struct V9fsConf 177 { 178 /* tag name for the device */ 179 char *tag; 180 char *fsdev_id; 181 } V9fsConf; 182 183 /* 9p2000.L xattr flags (matches Linux values) */ 184 #define P9_XATTR_CREATE 1 185 #define P9_XATTR_REPLACE 2 186 187 typedef struct V9fsXattr 188 { 189 uint64_t copied_len; 190 uint64_t len; 191 void *value; 192 V9fsString name; 193 int flags; 194 bool xattrwalk_fid; 195 } V9fsXattr; 196 197 typedef struct V9fsDir { 198 DIR *stream; 199 P9ProtoVersion proto_version; 200 /* readdir mutex type used for 9P2000.u protocol variant */ 201 CoMutex readdir_mutex_u; 202 /* readdir mutex type used for 9P2000.L protocol variant */ 203 QemuMutex readdir_mutex_L; 204 } V9fsDir; 205 206 static inline void v9fs_readdir_lock(V9fsDir *dir) 207 { 208 if (dir->proto_version == V9FS_PROTO_2000U) { 209 qemu_co_mutex_lock(&dir->readdir_mutex_u); 210 } else { 211 qemu_mutex_lock(&dir->readdir_mutex_L); 212 } 213 } 214 215 static inline void v9fs_readdir_unlock(V9fsDir *dir) 216 { 217 if (dir->proto_version == V9FS_PROTO_2000U) { 218 qemu_co_mutex_unlock(&dir->readdir_mutex_u); 219 } else { 220 qemu_mutex_unlock(&dir->readdir_mutex_L); 221 } 222 } 223 224 static inline void v9fs_readdir_init(P9ProtoVersion proto_version, V9fsDir *dir) 225 { 226 dir->proto_version = proto_version; 227 if (proto_version == V9FS_PROTO_2000U) { 228 qemu_co_mutex_init(&dir->readdir_mutex_u); 229 } else { 230 qemu_mutex_init(&dir->readdir_mutex_L); 231 } 232 } 233 234 /* 235 * Type for 9p fs drivers' (a.k.a. 9p backends) result of readdir requests, 236 * which is a chained list of directory entries. 237 */ 238 typedef struct V9fsDirEnt { 239 /* mandatory (must not be NULL) information for all readdir requests */ 240 struct dirent *dent; 241 /* 242 * optional (may be NULL): A full stat of each directory entry is just 243 * done if explicitly told to fs driver. 244 */ 245 struct stat *st; 246 /* 247 * instead of an array, directory entries are always returned as 248 * chained list, that's because the amount of entries retrieved by fs 249 * drivers is dependent on the individual entries' name (since response 250 * messages are size limited), so the final amount cannot be estimated 251 * before hand 252 */ 253 struct V9fsDirEnt *next; 254 } V9fsDirEnt; 255 256 /* 257 * Filled by fs driver on open and other 258 * calls. 259 */ 260 union V9fsFidOpenState { 261 int fd; 262 V9fsDir dir; 263 V9fsXattr xattr; 264 /* 265 * private pointer for fs drivers, that 266 * have its own internal representation of 267 * open files. 268 */ 269 void *private; 270 }; 271 272 struct V9fsFidState { 273 int fid_type; 274 int32_t fid; 275 V9fsPath path; 276 V9fsFidOpenState fs; 277 V9fsFidOpenState fs_reclaim; 278 int flags; 279 int open_flags; 280 uid_t uid; 281 int ref; 282 bool clunked; 283 QSIMPLEQ_ENTRY(V9fsFidState) next; 284 QSLIST_ENTRY(V9fsFidState) reclaim_next; 285 }; 286 287 typedef enum AffixType_t { 288 AffixType_Prefix, 289 AffixType_Suffix, /* A.k.a. postfix. */ 290 } AffixType_t; 291 292 /* 293 * Unique affix of variable length. 294 * 295 * An affix is (currently) either a suffix or a prefix, which is either 296 * going to be prepended (prefix) or appended (suffix) with some other 297 * number for the goal to generate unique numbers. Accordingly the 298 * suffixes (or prefixes) we generate @b must all have the mathematical 299 * property of being suffix-free (or prefix-free in case of prefixes) 300 * so that no matter what number we concatenate the affix with, that we 301 * always reliably get unique numbers as result after concatenation. 302 */ 303 typedef struct VariLenAffix { 304 AffixType_t type; /* Whether this affix is a suffix or a prefix. */ 305 uint64_t value; /* Actual numerical value of this affix. */ 306 /* 307 * Lenght of the affix, that is how many (of the lowest) bits of ``value`` 308 * must be used for appending/prepending this affix to its final resulting, 309 * unique number. 310 */ 311 int bits; 312 } VariLenAffix; 313 314 /* See qid_inode_prefix_hash_bits(). */ 315 typedef struct { 316 dev_t dev; /* FS device on host. */ 317 /* 318 * How many (high) bits of the original inode number shall be used for 319 * hashing. 320 */ 321 int prefix_bits; 322 } QpdEntry; 323 324 /* QID path prefix entry, see stat_to_qid */ 325 typedef struct { 326 dev_t dev; 327 uint16_t ino_prefix; 328 uint32_t qp_affix_index; 329 VariLenAffix qp_affix; 330 } QppEntry; 331 332 /* QID path full entry, as above */ 333 typedef struct { 334 dev_t dev; 335 ino_t ino; 336 uint64_t path; 337 } QpfEntry; 338 339 struct V9fsState { 340 QLIST_HEAD(, V9fsPDU) free_list; 341 QLIST_HEAD(, V9fsPDU) active_list; 342 QSIMPLEQ_HEAD(, V9fsFidState) fid_list; 343 FileOperations *ops; 344 FsContext ctx; 345 char *tag; 346 P9ProtoVersion proto_version; 347 int32_t msize; 348 V9fsPDU pdus[MAX_REQ]; 349 const V9fsTransport *transport; 350 /* 351 * lock ensuring atomic path update 352 * on rename. 353 */ 354 CoRwlock rename_lock; 355 int32_t root_fid; 356 Error *migration_blocker; 357 V9fsConf fsconf; 358 struct stat root_st; 359 dev_t dev_id; 360 struct qht qpd_table; 361 struct qht qpp_table; 362 struct qht qpf_table; 363 uint64_t qp_ndevices; /* Amount of entries in qpd_table. */ 364 uint16_t qp_affix_next; 365 uint64_t qp_fullpath_next; 366 }; 367 368 /* 9p2000.L open flags */ 369 #define P9_DOTL_RDONLY 00000000 370 #define P9_DOTL_WRONLY 00000001 371 #define P9_DOTL_RDWR 00000002 372 #define P9_DOTL_NOACCESS 00000003 373 #define P9_DOTL_CREATE 00000100 374 #define P9_DOTL_EXCL 00000200 375 #define P9_DOTL_NOCTTY 00000400 376 #define P9_DOTL_TRUNC 00001000 377 #define P9_DOTL_APPEND 00002000 378 #define P9_DOTL_NONBLOCK 00004000 379 #define P9_DOTL_DSYNC 00010000 380 #define P9_DOTL_FASYNC 00020000 381 #define P9_DOTL_DIRECT 00040000 382 #define P9_DOTL_LARGEFILE 00100000 383 #define P9_DOTL_DIRECTORY 00200000 384 #define P9_DOTL_NOFOLLOW 00400000 385 #define P9_DOTL_NOATIME 01000000 386 #define P9_DOTL_CLOEXEC 02000000 387 #define P9_DOTL_SYNC 04000000 388 389 /* 9p2000.L at flags */ 390 #define P9_DOTL_AT_REMOVEDIR 0x200 391 392 /* 9P2000.L lock type */ 393 #define P9_LOCK_TYPE_RDLCK 0 394 #define P9_LOCK_TYPE_WRLCK 1 395 #define P9_LOCK_TYPE_UNLCK 2 396 397 #define P9_LOCK_SUCCESS 0 398 #define P9_LOCK_BLOCKED 1 399 #define P9_LOCK_ERROR 2 400 #define P9_LOCK_GRACE 3 401 402 #define P9_LOCK_FLAGS_BLOCK 1 403 #define P9_LOCK_FLAGS_RECLAIM 2 404 405 typedef struct V9fsFlock 406 { 407 uint8_t type; 408 uint32_t flags; 409 uint64_t start; /* absolute offset */ 410 uint64_t length; 411 uint32_t proc_id; 412 V9fsString client_id; 413 } V9fsFlock; 414 415 typedef struct V9fsGetlock 416 { 417 uint8_t type; 418 uint64_t start; /* absolute offset */ 419 uint64_t length; 420 uint32_t proc_id; 421 V9fsString client_id; 422 } V9fsGetlock; 423 424 extern int open_fd_hw; 425 extern int total_open_fd; 426 427 static inline void v9fs_path_write_lock(V9fsState *s) 428 { 429 if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) { 430 qemu_co_rwlock_wrlock(&s->rename_lock); 431 } 432 } 433 434 static inline void v9fs_path_read_lock(V9fsState *s) 435 { 436 if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) { 437 qemu_co_rwlock_rdlock(&s->rename_lock); 438 } 439 } 440 441 static inline void v9fs_path_unlock(V9fsState *s) 442 { 443 if (s->ctx.export_flags & V9FS_PATHNAME_FSCONTEXT) { 444 qemu_co_rwlock_unlock(&s->rename_lock); 445 } 446 } 447 448 static inline uint8_t v9fs_request_cancelled(V9fsPDU *pdu) 449 { 450 return pdu->cancelled; 451 } 452 453 void coroutine_fn v9fs_reclaim_fd(V9fsPDU *pdu); 454 void v9fs_path_init(V9fsPath *path); 455 void v9fs_path_free(V9fsPath *path); 456 void v9fs_path_sprintf(V9fsPath *path, const char *fmt, ...); 457 void v9fs_path_copy(V9fsPath *dst, const V9fsPath *src); 458 size_t v9fs_readdir_response_size(V9fsString *name); 459 int v9fs_name_to_path(V9fsState *s, V9fsPath *dirpath, 460 const char *name, V9fsPath *path); 461 int v9fs_device_realize_common(V9fsState *s, const V9fsTransport *t, 462 Error **errp); 463 void v9fs_device_unrealize_common(V9fsState *s); 464 465 V9fsPDU *pdu_alloc(V9fsState *s); 466 void pdu_free(V9fsPDU *pdu); 467 void pdu_submit(V9fsPDU *pdu, P9MsgHeader *hdr); 468 void v9fs_reset(V9fsState *s); 469 470 struct V9fsTransport { 471 ssize_t (*pdu_vmarshal)(V9fsPDU *pdu, size_t offset, const char *fmt, 472 va_list ap); 473 ssize_t (*pdu_vunmarshal)(V9fsPDU *pdu, size_t offset, const char *fmt, 474 va_list ap); 475 void (*init_in_iov_from_pdu)(V9fsPDU *pdu, struct iovec **piov, 476 unsigned int *pniov, size_t size); 477 void (*init_out_iov_from_pdu)(V9fsPDU *pdu, struct iovec **piov, 478 unsigned int *pniov, size_t size); 479 void (*push_and_notify)(V9fsPDU *pdu); 480 }; 481 482 #if defined(XATTR_SIZE_MAX) 483 /* Linux */ 484 #define P9_XATTR_SIZE_MAX XATTR_SIZE_MAX 485 #elif defined(CONFIG_DARWIN) 486 /* 487 * Darwin doesn't seem to define a maximum xattr size in its user 488 * space header, so manually configure it across platforms as 64k. 489 * 490 * Having no limit at all can lead to QEMU crashing during large g_malloc() 491 * calls. Because QEMU does not currently support macOS guests, the below 492 * preliminary solution only works due to its being a reflection of the limit of 493 * Linux guests. 494 */ 495 #define P9_XATTR_SIZE_MAX 65536 496 #else 497 #error Missing definition for P9_XATTR_SIZE_MAX for this host system 498 #endif 499 500 #endif 501