devtmpfs.c 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442
  1. /*
  2. * devtmpfs - kernel-maintained tmpfs-based /dev
  3. *
  4. * Copyright (C) 2009, Kay Sievers <kay.sievers@vrfy.org>
  5. *
  6. * During bootup, before any driver core device is registered,
  7. * devtmpfs, a tmpfs-based filesystem is created. Every driver-core
  8. * device which requests a device node, will add a node in this
  9. * filesystem.
  10. * By default, all devices are named after the name of the device,
  11. * owned by root and have a default mode of 0600. Subsystems can
  12. * overwrite the default setting if needed.
  13. */
  14. #include <linux/kernel.h>
  15. #include <linux/syscalls.h>
  16. #include <linux/mount.h>
  17. #include <linux/device.h>
  18. #include <linux/genhd.h>
  19. #include <linux/namei.h>
  20. #include <linux/fs.h>
  21. #include <linux/shmem_fs.h>
  22. #include <linux/ramfs.h>
  23. #include <linux/sched.h>
  24. #include <linux/slab.h>
  25. #include <linux/kthread.h>
  26. static struct task_struct *thread;
  27. #if defined CONFIG_DEVTMPFS_MOUNT
  28. static int mount_dev = 1;
  29. #else
  30. static int mount_dev;
  31. #endif
  32. static DEFINE_SPINLOCK(req_lock);
  33. static struct req {
  34. struct req *next;
  35. struct completion done;
  36. int err;
  37. const char *name;
  38. umode_t mode; /* 0 => delete */
  39. uid_t uid;
  40. gid_t gid;
  41. struct device *dev;
  42. } *requests;
  43. static int __init mount_param(char *str)
  44. {
  45. mount_dev = simple_strtoul(str, NULL, 0);
  46. return 1;
  47. }
  48. __setup("devtmpfs.mount=", mount_param);
  49. static struct dentry *dev_mount(struct file_system_type *fs_type, int flags,
  50. const char *dev_name, void *data)
  51. {
  52. #ifdef CONFIG_TMPFS
  53. return mount_single(fs_type, flags, data, shmem_fill_super);
  54. #else
  55. return mount_single(fs_type, flags, data, ramfs_fill_super);
  56. #endif
  57. }
  58. static struct file_system_type dev_fs_type = {
  59. .name = "devtmpfs",
  60. .mount = dev_mount,
  61. .kill_sb = kill_litter_super,
  62. };
  63. #ifdef CONFIG_BLOCK
  64. static inline int is_blockdev(struct device *dev)
  65. {
  66. return dev->class == &block_class;
  67. }
  68. #else
  69. static inline int is_blockdev(struct device *dev) { return 0; }
  70. #endif
  71. int devtmpfs_create_node(struct device *dev)
  72. {
  73. const char *tmp = NULL;
  74. struct req req;
  75. if (!thread)
  76. return 0;
  77. req.mode = 0;
  78. req.uid = 0;
  79. req.gid = 0;
  80. req.name = device_get_devnode(dev, &req.mode, &req.uid, &req.gid, &tmp);
  81. if (!req.name)
  82. return -ENOMEM;
  83. if (req.mode == 0)
  84. req.mode = 0600;
  85. if (is_blockdev(dev))
  86. req.mode |= S_IFBLK;
  87. else
  88. req.mode |= S_IFCHR;
  89. req.dev = dev;
  90. init_completion(&req.done);
  91. spin_lock(&req_lock);
  92. req.next = requests;
  93. requests = &req;
  94. spin_unlock(&req_lock);
  95. wake_up_process(thread);
  96. wait_for_completion(&req.done);
  97. kfree(tmp);
  98. return req.err;
  99. }
  100. int devtmpfs_delete_node(struct device *dev)
  101. {
  102. const char *tmp = NULL;
  103. struct req req;
  104. if (!thread)
  105. return 0;
  106. req.name = device_get_devnode(dev, NULL, NULL, NULL, &tmp);
  107. if (!req.name)
  108. return -ENOMEM;
  109. req.mode = 0;
  110. req.dev = dev;
  111. init_completion(&req.done);
  112. spin_lock(&req_lock);
  113. req.next = requests;
  114. requests = &req;
  115. spin_unlock(&req_lock);
  116. wake_up_process(thread);
  117. wait_for_completion(&req.done);
  118. kfree(tmp);
  119. return req.err;
  120. }
  121. static int dev_mkdir(const char *name, umode_t mode)
  122. {
  123. struct dentry *dentry;
  124. struct path path;
  125. int err;
  126. dentry = kern_path_create(AT_FDCWD, name, &path, LOOKUP_DIRECTORY);
  127. if (IS_ERR(dentry))
  128. return PTR_ERR(dentry);
  129. err = vfs_mkdir(path.dentry->d_inode, dentry, mode);
  130. if (!err)
  131. /* mark as kernel-created inode */
  132. dentry->d_inode->i_private = &thread;
  133. done_path_create(&path, dentry);
  134. return err;
  135. }
  136. static int create_path(const char *nodepath)
  137. {
  138. char *path;
  139. char *s;
  140. int err = 0;
  141. /* parent directories do not exist, create them */
  142. path = kstrdup(nodepath, GFP_KERNEL);
  143. if (!path)
  144. return -ENOMEM;
  145. s = path;
  146. for (;;) {
  147. s = strchr(s, '/');
  148. if (!s)
  149. break;
  150. s[0] = '\0';
  151. err = dev_mkdir(path, 0755);
  152. if (err && err != -EEXIST)
  153. break;
  154. s[0] = '/';
  155. s++;
  156. }
  157. kfree(path);
  158. return err;
  159. }
  160. static int handle_create(const char *nodename, umode_t mode, uid_t uid,
  161. gid_t gid, struct device *dev)
  162. {
  163. struct dentry *dentry;
  164. struct path path;
  165. int err;
  166. dentry = kern_path_create(AT_FDCWD, nodename, &path, 0);
  167. if (dentry == ERR_PTR(-ENOENT)) {
  168. create_path(nodename);
  169. dentry = kern_path_create(AT_FDCWD, nodename, &path, 0);
  170. }
  171. if (IS_ERR(dentry))
  172. return PTR_ERR(dentry);
  173. err = vfs_mknod(path.dentry->d_inode, dentry, mode, dev->devt);
  174. if (!err) {
  175. struct iattr newattrs;
  176. newattrs.ia_mode = mode;
  177. newattrs.ia_uid = uid;
  178. newattrs.ia_gid = gid;
  179. newattrs.ia_valid = ATTR_MODE|ATTR_UID|ATTR_GID;
  180. mutex_lock(&dentry->d_inode->i_mutex);
  181. notify_change(dentry, &newattrs);
  182. mutex_unlock(&dentry->d_inode->i_mutex);
  183. /* mark as kernel-created inode */
  184. dentry->d_inode->i_private = &thread;
  185. }
  186. done_path_create(&path, dentry);
  187. return err;
  188. }
  189. static int dev_rmdir(const char *name)
  190. {
  191. struct path parent;
  192. struct dentry *dentry;
  193. int err;
  194. dentry = kern_path_locked(name, &parent);
  195. if (IS_ERR(dentry))
  196. return PTR_ERR(dentry);
  197. if (dentry->d_inode) {
  198. if (dentry->d_inode->i_private == &thread)
  199. err = vfs_rmdir(parent.dentry->d_inode, dentry);
  200. else
  201. err = -EPERM;
  202. } else {
  203. err = -ENOENT;
  204. }
  205. dput(dentry);
  206. mutex_unlock(&parent.dentry->d_inode->i_mutex);
  207. path_put(&parent);
  208. return err;
  209. }
  210. static int delete_path(const char *nodepath)
  211. {
  212. const char *path;
  213. int err = 0;
  214. path = kstrdup(nodepath, GFP_KERNEL);
  215. if (!path)
  216. return -ENOMEM;
  217. for (;;) {
  218. char *base;
  219. base = strrchr(path, '/');
  220. if (!base)
  221. break;
  222. base[0] = '\0';
  223. err = dev_rmdir(path);
  224. if (err)
  225. break;
  226. }
  227. kfree(path);
  228. return err;
  229. }
  230. static int dev_mynode(struct device *dev, struct inode *inode, struct kstat *stat)
  231. {
  232. /* did we create it */
  233. if (inode->i_private != &thread)
  234. return 0;
  235. /* does the dev_t match */
  236. if (is_blockdev(dev)) {
  237. if (!S_ISBLK(stat->mode))
  238. return 0;
  239. } else {
  240. if (!S_ISCHR(stat->mode))
  241. return 0;
  242. }
  243. if (stat->rdev != dev->devt)
  244. return 0;
  245. /* ours */
  246. return 1;
  247. }
  248. static int handle_remove(const char *nodename, struct device *dev)
  249. {
  250. struct path parent;
  251. struct dentry *dentry;
  252. int deleted = 1;
  253. int err;
  254. dentry = kern_path_locked(nodename, &parent);
  255. if (IS_ERR(dentry))
  256. return PTR_ERR(dentry);
  257. if (dentry->d_inode) {
  258. struct kstat stat;
  259. struct path p = {.mnt = parent.mnt, .dentry = dentry};
  260. err = vfs_getattr(&p, &stat);
  261. if (!err && dev_mynode(dev, dentry->d_inode, &stat)) {
  262. struct iattr newattrs;
  263. /*
  264. * before unlinking this node, reset permissions
  265. * of possible references like hardlinks
  266. */
  267. newattrs.ia_uid = GLOBAL_ROOT_UID;
  268. newattrs.ia_gid = GLOBAL_ROOT_GID;
  269. newattrs.ia_mode = stat.mode & ~0777;
  270. newattrs.ia_valid =
  271. ATTR_UID|ATTR_GID|ATTR_MODE;
  272. mutex_lock(&dentry->d_inode->i_mutex);
  273. notify_change(dentry, &newattrs);
  274. mutex_unlock(&dentry->d_inode->i_mutex);
  275. err = vfs_unlink(parent.dentry->d_inode, dentry);
  276. if (!err || err == -ENOENT)
  277. deleted = 1;
  278. }
  279. } else {
  280. err = -ENOENT;
  281. }
  282. dput(dentry);
  283. mutex_unlock(&parent.dentry->d_inode->i_mutex);
  284. path_put(&parent);
  285. if (deleted && strchr(nodename, '/'))
  286. delete_path(nodename);
  287. return err;
  288. }
  289. /*
  290. * If configured, or requested by the commandline, devtmpfs will be
  291. * auto-mounted after the kernel mounted the root filesystem.
  292. */
  293. int devtmpfs_mount(const char *mntdir)
  294. {
  295. int err;
  296. if (!mount_dev)
  297. return 0;
  298. if (!thread)
  299. return 0;
  300. err = sys_mount("devtmpfs", (char *)mntdir, "devtmpfs", MS_SILENT, NULL);
  301. if (err)
  302. printk(KERN_INFO "devtmpfs: error mounting %i\n", err);
  303. else
  304. printk(KERN_INFO "devtmpfs: mounted\n");
  305. return err;
  306. }
  307. static DECLARE_COMPLETION(setup_done);
  308. static int handle(const char *name, umode_t mode, uid_t uid, gid_t gid,
  309. struct device *dev)
  310. {
  311. if (mode)
  312. return handle_create(name, mode, uid, gid, dev);
  313. else
  314. return handle_remove(name, dev);
  315. }
  316. static int devtmpfsd(void *p)
  317. {
  318. char options[] = "mode=0755";
  319. int *err = p;
  320. *err = sys_unshare(CLONE_NEWNS);
  321. if (*err)
  322. goto out;
  323. *err = sys_mount("devtmpfs", "/", "devtmpfs", MS_SILENT, options);
  324. if (*err)
  325. goto out;
  326. sys_chdir("/.."); /* will traverse into overmounted root */
  327. sys_chroot(".");
  328. complete(&setup_done);
  329. while (1) {
  330. spin_lock(&req_lock);
  331. while (requests) {
  332. struct req *req = requests;
  333. requests = NULL;
  334. spin_unlock(&req_lock);
  335. while (req) {
  336. struct req *next = req->next;
  337. req->err = handle(req->name, req->mode,
  338. req->uid, req->gid, req->dev);
  339. complete(&req->done);
  340. req = next;
  341. }
  342. spin_lock(&req_lock);
  343. }
  344. __set_current_state(TASK_INTERRUPTIBLE);
  345. spin_unlock(&req_lock);
  346. schedule();
  347. }
  348. return 0;
  349. out:
  350. complete(&setup_done);
  351. return *err;
  352. }
  353. /*
  354. * Create devtmpfs instance, driver-core devices will add their device
  355. * nodes here.
  356. */
  357. int __init devtmpfs_init(void)
  358. {
  359. int err = register_filesystem(&dev_fs_type);
  360. if (err) {
  361. printk(KERN_ERR "devtmpfs: unable to register devtmpfs "
  362. "type %i\n", err);
  363. return err;
  364. }
  365. thread = kthread_run(devtmpfsd, &err, "kdevtmpfs");
  366. if (!IS_ERR(thread)) {
  367. wait_for_completion(&setup_done);
  368. } else {
  369. err = PTR_ERR(thread);
  370. thread = NULL;
  371. }
  372. if (err) {
  373. printk(KERN_ERR "devtmpfs: unable to create devtmpfs %i\n", err);
  374. unregister_filesystem(&dev_fs_type);
  375. return err;
  376. }
  377. printk(KERN_INFO "devtmpfs: initialized\n");
  378. return 0;
  379. }