dir.c 25 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115
  1. /*
  2. *
  3. * Copyright (C) 2011 Novell Inc.
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms of the GNU General Public License version 2 as published by
  7. * the Free Software Foundation.
  8. */
  9. #include <linux/fs.h>
  10. #include <linux/namei.h>
  11. #include <linux/xattr.h>
  12. #include <linux/security.h>
  13. #include <linux/cred.h>
  14. #include <linux/module.h>
  15. #include <linux/posix_acl.h>
  16. #include <linux/posix_acl_xattr.h>
  17. #include <linux/atomic.h>
  18. #include <linux/ratelimit.h>
  19. #include "overlayfs.h"
  20. static unsigned short ovl_redirect_max = 256;
  21. module_param_named(redirect_max, ovl_redirect_max, ushort, 0644);
  22. MODULE_PARM_DESC(ovl_redirect_max,
  23. "Maximum length of absolute redirect xattr value");
  24. int ovl_cleanup(struct inode *wdir, struct dentry *wdentry)
  25. {
  26. int err;
  27. dget(wdentry);
  28. if (d_is_dir(wdentry))
  29. err = ovl_do_rmdir(wdir, wdentry);
  30. else
  31. err = ovl_do_unlink(wdir, wdentry);
  32. dput(wdentry);
  33. if (err) {
  34. pr_err("overlayfs: cleanup of '%pd2' failed (%i)\n",
  35. wdentry, err);
  36. }
  37. return err;
  38. }
  39. struct dentry *ovl_lookup_temp(struct dentry *workdir)
  40. {
  41. struct dentry *temp;
  42. char name[20];
  43. static atomic_t temp_id = ATOMIC_INIT(0);
  44. /* counter is allowed to wrap, since temp dentries are ephemeral */
  45. snprintf(name, sizeof(name), "#%x", atomic_inc_return(&temp_id));
  46. temp = lookup_one_len(name, workdir, strlen(name));
  47. if (!IS_ERR(temp) && temp->d_inode) {
  48. pr_err("overlayfs: workdir/%s already exists\n", name);
  49. dput(temp);
  50. temp = ERR_PTR(-EIO);
  51. }
  52. return temp;
  53. }
  54. /* caller holds i_mutex on workdir */
  55. static struct dentry *ovl_whiteout(struct dentry *workdir)
  56. {
  57. int err;
  58. struct dentry *whiteout;
  59. struct inode *wdir = workdir->d_inode;
  60. whiteout = ovl_lookup_temp(workdir);
  61. if (IS_ERR(whiteout))
  62. return whiteout;
  63. err = ovl_do_whiteout(wdir, whiteout);
  64. if (err) {
  65. dput(whiteout);
  66. whiteout = ERR_PTR(err);
  67. }
  68. return whiteout;
  69. }
  70. /* Caller must hold i_mutex on both workdir and dir */
  71. int ovl_cleanup_and_whiteout(struct dentry *workdir, struct inode *dir,
  72. struct dentry *dentry)
  73. {
  74. struct inode *wdir = workdir->d_inode;
  75. struct dentry *whiteout;
  76. int err;
  77. int flags = 0;
  78. whiteout = ovl_whiteout(workdir);
  79. err = PTR_ERR(whiteout);
  80. if (IS_ERR(whiteout))
  81. return err;
  82. if (d_is_dir(dentry))
  83. flags = RENAME_EXCHANGE;
  84. err = ovl_do_rename(wdir, whiteout, dir, dentry, flags);
  85. if (err)
  86. goto kill_whiteout;
  87. if (flags)
  88. ovl_cleanup(wdir, dentry);
  89. out:
  90. dput(whiteout);
  91. return err;
  92. kill_whiteout:
  93. ovl_cleanup(wdir, whiteout);
  94. goto out;
  95. }
  96. int ovl_create_real(struct inode *dir, struct dentry *newdentry,
  97. struct cattr *attr, struct dentry *hardlink, bool debug)
  98. {
  99. int err;
  100. if (newdentry->d_inode)
  101. return -ESTALE;
  102. if (hardlink) {
  103. err = ovl_do_link(hardlink, dir, newdentry, debug);
  104. } else {
  105. switch (attr->mode & S_IFMT) {
  106. case S_IFREG:
  107. err = ovl_do_create(dir, newdentry, attr->mode, debug);
  108. break;
  109. case S_IFDIR:
  110. err = ovl_do_mkdir(dir, newdentry, attr->mode, debug);
  111. break;
  112. case S_IFCHR:
  113. case S_IFBLK:
  114. case S_IFIFO:
  115. case S_IFSOCK:
  116. err = ovl_do_mknod(dir, newdentry,
  117. attr->mode, attr->rdev, debug);
  118. break;
  119. case S_IFLNK:
  120. err = ovl_do_symlink(dir, newdentry, attr->link, debug);
  121. break;
  122. default:
  123. err = -EPERM;
  124. }
  125. }
  126. if (!err && WARN_ON(!newdentry->d_inode)) {
  127. /*
  128. * Not quite sure if non-instantiated dentry is legal or not.
  129. * VFS doesn't seem to care so check and warn here.
  130. */
  131. err = -ENOENT;
  132. }
  133. return err;
  134. }
  135. static int ovl_set_opaque_xerr(struct dentry *dentry, struct dentry *upper,
  136. int xerr)
  137. {
  138. int err;
  139. err = ovl_check_setxattr(dentry, upper, OVL_XATTR_OPAQUE, "y", 1, xerr);
  140. if (!err)
  141. ovl_dentry_set_opaque(dentry);
  142. return err;
  143. }
  144. static int ovl_set_opaque(struct dentry *dentry, struct dentry *upperdentry)
  145. {
  146. /*
  147. * Fail with -EIO when trying to create opaque dir and upper doesn't
  148. * support xattrs. ovl_rename() calls ovl_set_opaque_xerr(-EXDEV) to
  149. * return a specific error for noxattr case.
  150. */
  151. return ovl_set_opaque_xerr(dentry, upperdentry, -EIO);
  152. }
  153. /* Common operations required to be done after creation of file on upper */
  154. static void ovl_instantiate(struct dentry *dentry, struct inode *inode,
  155. struct dentry *newdentry, bool hardlink)
  156. {
  157. ovl_dentry_version_inc(dentry->d_parent, false);
  158. ovl_dentry_set_upper_alias(dentry);
  159. if (!hardlink) {
  160. ovl_inode_update(inode, newdentry);
  161. ovl_copyattr(newdentry->d_inode, inode);
  162. } else {
  163. WARN_ON(ovl_inode_real(inode) != d_inode(newdentry));
  164. dput(newdentry);
  165. inc_nlink(inode);
  166. }
  167. d_instantiate(dentry, inode);
  168. /* Force lookup of new upper hardlink to find its lower */
  169. if (hardlink)
  170. d_drop(dentry);
  171. }
  172. static bool ovl_type_merge(struct dentry *dentry)
  173. {
  174. return OVL_TYPE_MERGE(ovl_path_type(dentry));
  175. }
  176. static bool ovl_type_origin(struct dentry *dentry)
  177. {
  178. return OVL_TYPE_ORIGIN(ovl_path_type(dentry));
  179. }
  180. static int ovl_create_upper(struct dentry *dentry, struct inode *inode,
  181. struct cattr *attr, struct dentry *hardlink)
  182. {
  183. struct dentry *upperdir = ovl_dentry_upper(dentry->d_parent);
  184. struct inode *udir = upperdir->d_inode;
  185. struct dentry *newdentry;
  186. int err;
  187. if (!hardlink && !IS_POSIXACL(udir))
  188. attr->mode &= ~current_umask();
  189. inode_lock_nested(udir, I_MUTEX_PARENT);
  190. newdentry = lookup_one_len(dentry->d_name.name, upperdir,
  191. dentry->d_name.len);
  192. err = PTR_ERR(newdentry);
  193. if (IS_ERR(newdentry))
  194. goto out_unlock;
  195. err = ovl_create_real(udir, newdentry, attr, hardlink, false);
  196. if (err)
  197. goto out_dput;
  198. if (ovl_type_merge(dentry->d_parent) && d_is_dir(newdentry)) {
  199. /* Setting opaque here is just an optimization, allow to fail */
  200. ovl_set_opaque(dentry, newdentry);
  201. }
  202. ovl_instantiate(dentry, inode, newdentry, !!hardlink);
  203. newdentry = NULL;
  204. out_dput:
  205. dput(newdentry);
  206. out_unlock:
  207. inode_unlock(udir);
  208. return err;
  209. }
  210. static struct dentry *ovl_clear_empty(struct dentry *dentry,
  211. struct list_head *list)
  212. {
  213. struct dentry *workdir = ovl_workdir(dentry);
  214. struct inode *wdir = workdir->d_inode;
  215. struct dentry *upperdir = ovl_dentry_upper(dentry->d_parent);
  216. struct inode *udir = upperdir->d_inode;
  217. struct path upperpath;
  218. struct dentry *upper;
  219. struct dentry *opaquedir;
  220. struct kstat stat;
  221. int err;
  222. if (WARN_ON(!workdir))
  223. return ERR_PTR(-EROFS);
  224. err = ovl_lock_rename_workdir(workdir, upperdir);
  225. if (err)
  226. goto out;
  227. ovl_path_upper(dentry, &upperpath);
  228. err = vfs_getattr(&upperpath, &stat,
  229. STATX_BASIC_STATS, AT_STATX_SYNC_AS_STAT);
  230. if (err)
  231. goto out_unlock;
  232. err = -ESTALE;
  233. if (!S_ISDIR(stat.mode))
  234. goto out_unlock;
  235. upper = upperpath.dentry;
  236. if (upper->d_parent->d_inode != udir)
  237. goto out_unlock;
  238. opaquedir = ovl_lookup_temp(workdir);
  239. err = PTR_ERR(opaquedir);
  240. if (IS_ERR(opaquedir))
  241. goto out_unlock;
  242. err = ovl_create_real(wdir, opaquedir,
  243. &(struct cattr){.mode = stat.mode}, NULL, true);
  244. if (err)
  245. goto out_dput;
  246. err = ovl_copy_xattr(upper, opaquedir);
  247. if (err)
  248. goto out_cleanup;
  249. err = ovl_set_opaque(dentry, opaquedir);
  250. if (err)
  251. goto out_cleanup;
  252. inode_lock(opaquedir->d_inode);
  253. err = ovl_set_attr(opaquedir, &stat);
  254. inode_unlock(opaquedir->d_inode);
  255. if (err)
  256. goto out_cleanup;
  257. err = ovl_do_rename(wdir, opaquedir, udir, upper, RENAME_EXCHANGE);
  258. if (err)
  259. goto out_cleanup;
  260. ovl_cleanup_whiteouts(upper, list);
  261. ovl_cleanup(wdir, upper);
  262. unlock_rename(workdir, upperdir);
  263. /* dentry's upper doesn't match now, get rid of it */
  264. d_drop(dentry);
  265. return opaquedir;
  266. out_cleanup:
  267. ovl_cleanup(wdir, opaquedir);
  268. out_dput:
  269. dput(opaquedir);
  270. out_unlock:
  271. unlock_rename(workdir, upperdir);
  272. out:
  273. return ERR_PTR(err);
  274. }
  275. static int ovl_set_upper_acl(struct dentry *upperdentry, const char *name,
  276. const struct posix_acl *acl)
  277. {
  278. void *buffer;
  279. size_t size;
  280. int err;
  281. if (!IS_ENABLED(CONFIG_FS_POSIX_ACL) || !acl)
  282. return 0;
  283. size = posix_acl_to_xattr(NULL, acl, NULL, 0);
  284. buffer = kmalloc(size, GFP_KERNEL);
  285. if (!buffer)
  286. return -ENOMEM;
  287. size = posix_acl_to_xattr(&init_user_ns, acl, buffer, size);
  288. err = size;
  289. if (err < 0)
  290. goto out_free;
  291. err = vfs_setxattr(upperdentry, name, buffer, size, XATTR_CREATE);
  292. out_free:
  293. kfree(buffer);
  294. return err;
  295. }
  296. static int ovl_create_over_whiteout(struct dentry *dentry, struct inode *inode,
  297. struct cattr *cattr,
  298. struct dentry *hardlink)
  299. {
  300. struct dentry *workdir = ovl_workdir(dentry);
  301. struct inode *wdir = workdir->d_inode;
  302. struct dentry *upperdir = ovl_dentry_upper(dentry->d_parent);
  303. struct inode *udir = upperdir->d_inode;
  304. struct dentry *upper;
  305. struct dentry *newdentry;
  306. int err;
  307. struct posix_acl *acl, *default_acl;
  308. if (WARN_ON(!workdir))
  309. return -EROFS;
  310. if (!hardlink) {
  311. err = posix_acl_create(dentry->d_parent->d_inode,
  312. &cattr->mode, &default_acl, &acl);
  313. if (err)
  314. return err;
  315. }
  316. err = ovl_lock_rename_workdir(workdir, upperdir);
  317. if (err)
  318. goto out;
  319. newdentry = ovl_lookup_temp(workdir);
  320. err = PTR_ERR(newdentry);
  321. if (IS_ERR(newdentry))
  322. goto out_unlock;
  323. upper = lookup_one_len(dentry->d_name.name, upperdir,
  324. dentry->d_name.len);
  325. err = PTR_ERR(upper);
  326. if (IS_ERR(upper))
  327. goto out_dput;
  328. err = ovl_create_real(wdir, newdentry, cattr, hardlink, true);
  329. if (err)
  330. goto out_dput2;
  331. /*
  332. * mode could have been mutilated due to umask (e.g. sgid directory)
  333. */
  334. if (!hardlink &&
  335. !S_ISLNK(cattr->mode) &&
  336. newdentry->d_inode->i_mode != cattr->mode) {
  337. struct iattr attr = {
  338. .ia_valid = ATTR_MODE,
  339. .ia_mode = cattr->mode,
  340. };
  341. inode_lock(newdentry->d_inode);
  342. err = notify_change(newdentry, &attr, NULL);
  343. inode_unlock(newdentry->d_inode);
  344. if (err)
  345. goto out_cleanup;
  346. }
  347. if (!hardlink) {
  348. err = ovl_set_upper_acl(newdentry, XATTR_NAME_POSIX_ACL_ACCESS,
  349. acl);
  350. if (err)
  351. goto out_cleanup;
  352. err = ovl_set_upper_acl(newdentry, XATTR_NAME_POSIX_ACL_DEFAULT,
  353. default_acl);
  354. if (err)
  355. goto out_cleanup;
  356. }
  357. if (!hardlink && S_ISDIR(cattr->mode)) {
  358. err = ovl_set_opaque(dentry, newdentry);
  359. if (err)
  360. goto out_cleanup;
  361. err = ovl_do_rename(wdir, newdentry, udir, upper,
  362. RENAME_EXCHANGE);
  363. if (err)
  364. goto out_cleanup;
  365. ovl_cleanup(wdir, upper);
  366. } else {
  367. err = ovl_do_rename(wdir, newdentry, udir, upper, 0);
  368. if (err)
  369. goto out_cleanup;
  370. }
  371. ovl_instantiate(dentry, inode, newdentry, !!hardlink);
  372. newdentry = NULL;
  373. out_dput2:
  374. dput(upper);
  375. out_dput:
  376. dput(newdentry);
  377. out_unlock:
  378. unlock_rename(workdir, upperdir);
  379. out:
  380. if (!hardlink) {
  381. posix_acl_release(acl);
  382. posix_acl_release(default_acl);
  383. }
  384. return err;
  385. out_cleanup:
  386. ovl_cleanup(wdir, newdentry);
  387. goto out_dput2;
  388. }
  389. static int ovl_create_or_link(struct dentry *dentry, struct inode *inode,
  390. struct cattr *attr, struct dentry *hardlink,
  391. bool origin)
  392. {
  393. int err;
  394. const struct cred *old_cred;
  395. struct cred *override_cred;
  396. struct dentry *parent = dentry->d_parent;
  397. err = ovl_copy_up(parent);
  398. if (err)
  399. return err;
  400. old_cred = ovl_override_creds(dentry->d_sb);
  401. /*
  402. * When linking a file with copy up origin into a new parent, mark the
  403. * new parent dir "impure".
  404. */
  405. if (origin) {
  406. err = ovl_set_impure(parent, ovl_dentry_upper(parent));
  407. if (err)
  408. goto out_revert_creds;
  409. }
  410. err = -ENOMEM;
  411. override_cred = prepare_creds();
  412. if (override_cred) {
  413. override_cred->fsuid = inode->i_uid;
  414. override_cred->fsgid = inode->i_gid;
  415. if (!hardlink) {
  416. err = security_dentry_create_files_as(dentry,
  417. attr->mode, &dentry->d_name, old_cred,
  418. override_cred);
  419. if (err) {
  420. put_cred(override_cred);
  421. goto out_revert_creds;
  422. }
  423. }
  424. put_cred(override_creds(override_cred));
  425. put_cred(override_cred);
  426. if (!ovl_dentry_is_whiteout(dentry))
  427. err = ovl_create_upper(dentry, inode, attr,
  428. hardlink);
  429. else
  430. err = ovl_create_over_whiteout(dentry, inode, attr,
  431. hardlink);
  432. }
  433. out_revert_creds:
  434. revert_creds(old_cred);
  435. if (!err) {
  436. struct inode *realinode = d_inode(ovl_dentry_upper(dentry));
  437. WARN_ON(inode->i_mode != realinode->i_mode);
  438. WARN_ON(!uid_eq(inode->i_uid, realinode->i_uid));
  439. WARN_ON(!gid_eq(inode->i_gid, realinode->i_gid));
  440. }
  441. return err;
  442. }
  443. static int ovl_create_object(struct dentry *dentry, int mode, dev_t rdev,
  444. const char *link)
  445. {
  446. int err;
  447. struct inode *inode;
  448. struct cattr attr = {
  449. .rdev = rdev,
  450. .link = link,
  451. };
  452. err = ovl_want_write(dentry);
  453. if (err)
  454. goto out;
  455. err = -ENOMEM;
  456. inode = ovl_new_inode(dentry->d_sb, mode, rdev);
  457. if (!inode)
  458. goto out_drop_write;
  459. inode_init_owner(inode, dentry->d_parent->d_inode, mode);
  460. attr.mode = inode->i_mode;
  461. err = ovl_create_or_link(dentry, inode, &attr, NULL, false);
  462. if (err)
  463. iput(inode);
  464. out_drop_write:
  465. ovl_drop_write(dentry);
  466. out:
  467. return err;
  468. }
  469. static int ovl_create(struct inode *dir, struct dentry *dentry, umode_t mode,
  470. bool excl)
  471. {
  472. return ovl_create_object(dentry, (mode & 07777) | S_IFREG, 0, NULL);
  473. }
  474. static int ovl_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode)
  475. {
  476. return ovl_create_object(dentry, (mode & 07777) | S_IFDIR, 0, NULL);
  477. }
  478. static int ovl_mknod(struct inode *dir, struct dentry *dentry, umode_t mode,
  479. dev_t rdev)
  480. {
  481. /* Don't allow creation of "whiteout" on overlay */
  482. if (S_ISCHR(mode) && rdev == WHITEOUT_DEV)
  483. return -EPERM;
  484. return ovl_create_object(dentry, mode, rdev, NULL);
  485. }
  486. static int ovl_symlink(struct inode *dir, struct dentry *dentry,
  487. const char *link)
  488. {
  489. return ovl_create_object(dentry, S_IFLNK, 0, link);
  490. }
  491. static int ovl_link(struct dentry *old, struct inode *newdir,
  492. struct dentry *new)
  493. {
  494. int err;
  495. bool locked = false;
  496. struct inode *inode;
  497. err = ovl_want_write(old);
  498. if (err)
  499. goto out;
  500. err = ovl_copy_up(old);
  501. if (err)
  502. goto out_drop_write;
  503. err = ovl_nlink_start(old, &locked);
  504. if (err)
  505. goto out_drop_write;
  506. inode = d_inode(old);
  507. ihold(inode);
  508. err = ovl_create_or_link(new, inode, NULL, ovl_dentry_upper(old),
  509. ovl_type_origin(old));
  510. if (err)
  511. iput(inode);
  512. ovl_nlink_end(old, locked);
  513. out_drop_write:
  514. ovl_drop_write(old);
  515. out:
  516. return err;
  517. }
  518. static bool ovl_matches_upper(struct dentry *dentry, struct dentry *upper)
  519. {
  520. return d_inode(ovl_dentry_upper(dentry)) == d_inode(upper);
  521. }
  522. static int ovl_remove_and_whiteout(struct dentry *dentry,
  523. struct list_head *list)
  524. {
  525. struct dentry *workdir = ovl_workdir(dentry);
  526. struct dentry *upperdir = ovl_dentry_upper(dentry->d_parent);
  527. struct dentry *upper;
  528. struct dentry *opaquedir = NULL;
  529. int err;
  530. if (WARN_ON(!workdir))
  531. return -EROFS;
  532. if (!list_empty(list)) {
  533. opaquedir = ovl_clear_empty(dentry, list);
  534. err = PTR_ERR(opaquedir);
  535. if (IS_ERR(opaquedir))
  536. goto out;
  537. }
  538. err = ovl_lock_rename_workdir(workdir, upperdir);
  539. if (err)
  540. goto out_dput;
  541. upper = lookup_one_len(dentry->d_name.name, upperdir,
  542. dentry->d_name.len);
  543. err = PTR_ERR(upper);
  544. if (IS_ERR(upper))
  545. goto out_unlock;
  546. err = -ESTALE;
  547. if ((opaquedir && upper != opaquedir) ||
  548. (!opaquedir && ovl_dentry_upper(dentry) &&
  549. !ovl_matches_upper(dentry, upper))) {
  550. goto out_dput_upper;
  551. }
  552. err = ovl_cleanup_and_whiteout(workdir, d_inode(upperdir), upper);
  553. if (err)
  554. goto out_d_drop;
  555. ovl_dentry_version_inc(dentry->d_parent, true);
  556. out_d_drop:
  557. d_drop(dentry);
  558. out_dput_upper:
  559. dput(upper);
  560. out_unlock:
  561. unlock_rename(workdir, upperdir);
  562. out_dput:
  563. dput(opaquedir);
  564. out:
  565. return err;
  566. }
  567. static int ovl_remove_upper(struct dentry *dentry, bool is_dir,
  568. struct list_head *list)
  569. {
  570. struct dentry *upperdir = ovl_dentry_upper(dentry->d_parent);
  571. struct inode *dir = upperdir->d_inode;
  572. struct dentry *upper;
  573. struct dentry *opaquedir = NULL;
  574. int err;
  575. if (!list_empty(list)) {
  576. opaquedir = ovl_clear_empty(dentry, list);
  577. err = PTR_ERR(opaquedir);
  578. if (IS_ERR(opaquedir))
  579. goto out;
  580. }
  581. inode_lock_nested(dir, I_MUTEX_PARENT);
  582. upper = lookup_one_len(dentry->d_name.name, upperdir,
  583. dentry->d_name.len);
  584. err = PTR_ERR(upper);
  585. if (IS_ERR(upper))
  586. goto out_unlock;
  587. err = -ESTALE;
  588. if ((opaquedir && upper != opaquedir) ||
  589. (!opaquedir && !ovl_matches_upper(dentry, upper)))
  590. goto out_dput_upper;
  591. if (is_dir)
  592. err = vfs_rmdir(dir, upper);
  593. else
  594. err = vfs_unlink(dir, upper, NULL);
  595. ovl_dentry_version_inc(dentry->d_parent, ovl_type_origin(dentry));
  596. /*
  597. * Keeping this dentry hashed would mean having to release
  598. * upperpath/lowerpath, which could only be done if we are the
  599. * sole user of this dentry. Too tricky... Just unhash for
  600. * now.
  601. */
  602. if (!err)
  603. d_drop(dentry);
  604. out_dput_upper:
  605. dput(upper);
  606. out_unlock:
  607. inode_unlock(dir);
  608. dput(opaquedir);
  609. out:
  610. return err;
  611. }
  612. static bool ovl_pure_upper(struct dentry *dentry)
  613. {
  614. return !ovl_dentry_lower(dentry) &&
  615. !ovl_test_flag(OVL_WHITEOUTS, d_inode(dentry));
  616. }
  617. static int ovl_do_remove(struct dentry *dentry, bool is_dir)
  618. {
  619. int err;
  620. bool locked = false;
  621. const struct cred *old_cred;
  622. bool lower_positive = ovl_lower_positive(dentry);
  623. LIST_HEAD(list);
  624. /* No need to clean pure upper removed by vfs_rmdir() */
  625. if (is_dir && (lower_positive || !ovl_pure_upper(dentry))) {
  626. err = ovl_check_empty_dir(dentry, &list);
  627. if (err)
  628. goto out;
  629. }
  630. err = ovl_want_write(dentry);
  631. if (err)
  632. goto out;
  633. err = ovl_copy_up(dentry->d_parent);
  634. if (err)
  635. goto out_drop_write;
  636. err = ovl_nlink_start(dentry, &locked);
  637. if (err)
  638. goto out_drop_write;
  639. old_cred = ovl_override_creds(dentry->d_sb);
  640. if (!lower_positive)
  641. err = ovl_remove_upper(dentry, is_dir, &list);
  642. else
  643. err = ovl_remove_and_whiteout(dentry, &list);
  644. revert_creds(old_cred);
  645. if (!err) {
  646. if (is_dir)
  647. clear_nlink(dentry->d_inode);
  648. else
  649. drop_nlink(dentry->d_inode);
  650. }
  651. ovl_nlink_end(dentry, locked);
  652. out_drop_write:
  653. ovl_drop_write(dentry);
  654. out:
  655. ovl_cache_free(&list);
  656. return err;
  657. }
  658. static int ovl_unlink(struct inode *dir, struct dentry *dentry)
  659. {
  660. return ovl_do_remove(dentry, false);
  661. }
  662. static int ovl_rmdir(struct inode *dir, struct dentry *dentry)
  663. {
  664. return ovl_do_remove(dentry, true);
  665. }
  666. static bool ovl_type_merge_or_lower(struct dentry *dentry)
  667. {
  668. enum ovl_path_type type = ovl_path_type(dentry);
  669. return OVL_TYPE_MERGE(type) || !OVL_TYPE_UPPER(type);
  670. }
  671. static bool ovl_can_move(struct dentry *dentry)
  672. {
  673. return ovl_redirect_dir(dentry->d_sb) ||
  674. !d_is_dir(dentry) || !ovl_type_merge_or_lower(dentry);
  675. }
  676. static char *ovl_get_redirect(struct dentry *dentry, bool samedir)
  677. {
  678. char *buf, *ret;
  679. struct dentry *d, *tmp;
  680. int buflen = ovl_redirect_max + 1;
  681. if (samedir) {
  682. ret = kstrndup(dentry->d_name.name, dentry->d_name.len,
  683. GFP_KERNEL);
  684. goto out;
  685. }
  686. buf = ret = kmalloc(buflen, GFP_KERNEL);
  687. if (!buf)
  688. goto out;
  689. buflen--;
  690. buf[buflen] = '\0';
  691. for (d = dget(dentry); !IS_ROOT(d);) {
  692. const char *name;
  693. int thislen;
  694. spin_lock(&d->d_lock);
  695. name = ovl_dentry_get_redirect(d);
  696. if (name) {
  697. thislen = strlen(name);
  698. } else {
  699. name = d->d_name.name;
  700. thislen = d->d_name.len;
  701. }
  702. /* If path is too long, fall back to userspace move */
  703. if (thislen + (name[0] != '/') > buflen) {
  704. ret = ERR_PTR(-EXDEV);
  705. spin_unlock(&d->d_lock);
  706. goto out_put;
  707. }
  708. buflen -= thislen;
  709. memcpy(&buf[buflen], name, thislen);
  710. tmp = dget_dlock(d->d_parent);
  711. spin_unlock(&d->d_lock);
  712. dput(d);
  713. d = tmp;
  714. /* Absolute redirect: finished */
  715. if (buf[buflen] == '/')
  716. break;
  717. buflen--;
  718. buf[buflen] = '/';
  719. }
  720. ret = kstrdup(&buf[buflen], GFP_KERNEL);
  721. out_put:
  722. dput(d);
  723. kfree(buf);
  724. out:
  725. return ret ? ret : ERR_PTR(-ENOMEM);
  726. }
  727. static int ovl_set_redirect(struct dentry *dentry, bool samedir)
  728. {
  729. int err;
  730. const char *redirect = ovl_dentry_get_redirect(dentry);
  731. if (redirect && (samedir || redirect[0] == '/'))
  732. return 0;
  733. redirect = ovl_get_redirect(dentry, samedir);
  734. if (IS_ERR(redirect))
  735. return PTR_ERR(redirect);
  736. err = ovl_check_setxattr(dentry, ovl_dentry_upper(dentry),
  737. OVL_XATTR_REDIRECT,
  738. redirect, strlen(redirect), -EXDEV);
  739. if (!err) {
  740. spin_lock(&dentry->d_lock);
  741. ovl_dentry_set_redirect(dentry, redirect);
  742. spin_unlock(&dentry->d_lock);
  743. } else {
  744. kfree(redirect);
  745. pr_warn_ratelimited("overlayfs: failed to set redirect (%i)\n",
  746. err);
  747. /* Fall back to userspace copy-up */
  748. err = -EXDEV;
  749. }
  750. return err;
  751. }
  752. static int ovl_rename(struct inode *olddir, struct dentry *old,
  753. struct inode *newdir, struct dentry *new,
  754. unsigned int flags)
  755. {
  756. int err;
  757. bool locked = false;
  758. struct dentry *old_upperdir;
  759. struct dentry *new_upperdir;
  760. struct dentry *olddentry;
  761. struct dentry *newdentry;
  762. struct dentry *trap;
  763. bool old_opaque;
  764. bool new_opaque;
  765. bool cleanup_whiteout = false;
  766. bool overwrite = !(flags & RENAME_EXCHANGE);
  767. bool is_dir = d_is_dir(old);
  768. bool new_is_dir = d_is_dir(new);
  769. bool samedir = olddir == newdir;
  770. struct dentry *opaquedir = NULL;
  771. const struct cred *old_cred = NULL;
  772. LIST_HEAD(list);
  773. err = -EINVAL;
  774. if (flags & ~(RENAME_EXCHANGE | RENAME_NOREPLACE))
  775. goto out;
  776. flags &= ~RENAME_NOREPLACE;
  777. /* Don't copy up directory trees */
  778. err = -EXDEV;
  779. if (!ovl_can_move(old))
  780. goto out;
  781. if (!overwrite && !ovl_can_move(new))
  782. goto out;
  783. if (overwrite && new_is_dir && !ovl_pure_upper(new)) {
  784. err = ovl_check_empty_dir(new, &list);
  785. if (err)
  786. goto out;
  787. }
  788. if (overwrite) {
  789. if (ovl_lower_positive(old)) {
  790. if (!ovl_dentry_is_whiteout(new)) {
  791. /* Whiteout source */
  792. flags |= RENAME_WHITEOUT;
  793. } else {
  794. /* Switch whiteouts */
  795. flags |= RENAME_EXCHANGE;
  796. }
  797. } else if (is_dir && ovl_dentry_is_whiteout(new)) {
  798. flags |= RENAME_EXCHANGE;
  799. cleanup_whiteout = true;
  800. }
  801. }
  802. err = ovl_want_write(old);
  803. if (err)
  804. goto out;
  805. err = ovl_copy_up(old);
  806. if (err)
  807. goto out_drop_write;
  808. err = ovl_copy_up(new->d_parent);
  809. if (err)
  810. goto out_drop_write;
  811. if (!overwrite) {
  812. err = ovl_copy_up(new);
  813. if (err)
  814. goto out_drop_write;
  815. } else {
  816. err = ovl_nlink_start(new, &locked);
  817. if (err)
  818. goto out_drop_write;
  819. }
  820. old_cred = ovl_override_creds(old->d_sb);
  821. if (!list_empty(&list)) {
  822. opaquedir = ovl_clear_empty(new, &list);
  823. err = PTR_ERR(opaquedir);
  824. if (IS_ERR(opaquedir)) {
  825. opaquedir = NULL;
  826. goto out_revert_creds;
  827. }
  828. }
  829. old_upperdir = ovl_dentry_upper(old->d_parent);
  830. new_upperdir = ovl_dentry_upper(new->d_parent);
  831. if (!samedir) {
  832. /*
  833. * When moving a merge dir or non-dir with copy up origin into
  834. * a new parent, we are marking the new parent dir "impure".
  835. * When ovl_iterate() iterates an "impure" upper dir, it will
  836. * lookup the origin inodes of the entries to fill d_ino.
  837. */
  838. if (ovl_type_origin(old)) {
  839. err = ovl_set_impure(new->d_parent, new_upperdir);
  840. if (err)
  841. goto out_revert_creds;
  842. }
  843. if (!overwrite && ovl_type_origin(new)) {
  844. err = ovl_set_impure(old->d_parent, old_upperdir);
  845. if (err)
  846. goto out_revert_creds;
  847. }
  848. }
  849. trap = lock_rename(new_upperdir, old_upperdir);
  850. olddentry = lookup_one_len(old->d_name.name, old_upperdir,
  851. old->d_name.len);
  852. err = PTR_ERR(olddentry);
  853. if (IS_ERR(olddentry))
  854. goto out_unlock;
  855. err = -ESTALE;
  856. if (!ovl_matches_upper(old, olddentry))
  857. goto out_dput_old;
  858. newdentry = lookup_one_len(new->d_name.name, new_upperdir,
  859. new->d_name.len);
  860. err = PTR_ERR(newdentry);
  861. if (IS_ERR(newdentry))
  862. goto out_dput_old;
  863. old_opaque = ovl_dentry_is_opaque(old);
  864. new_opaque = ovl_dentry_is_opaque(new);
  865. err = -ESTALE;
  866. if (d_inode(new) && ovl_dentry_upper(new)) {
  867. if (opaquedir) {
  868. if (newdentry != opaquedir)
  869. goto out_dput;
  870. } else {
  871. if (!ovl_matches_upper(new, newdentry))
  872. goto out_dput;
  873. }
  874. } else {
  875. if (!d_is_negative(newdentry) &&
  876. (!new_opaque || !ovl_is_whiteout(newdentry)))
  877. goto out_dput;
  878. }
  879. if (olddentry == trap)
  880. goto out_dput;
  881. if (newdentry == trap)
  882. goto out_dput;
  883. if (WARN_ON(olddentry->d_inode == newdentry->d_inode))
  884. goto out_dput;
  885. err = 0;
  886. if (is_dir) {
  887. if (ovl_type_merge_or_lower(old))
  888. err = ovl_set_redirect(old, samedir);
  889. else if (!old_opaque && ovl_type_merge(new->d_parent))
  890. err = ovl_set_opaque_xerr(old, olddentry, -EXDEV);
  891. if (err)
  892. goto out_dput;
  893. }
  894. if (!overwrite && new_is_dir) {
  895. if (ovl_type_merge_or_lower(new))
  896. err = ovl_set_redirect(new, samedir);
  897. else if (!new_opaque && ovl_type_merge(old->d_parent))
  898. err = ovl_set_opaque_xerr(new, newdentry, -EXDEV);
  899. if (err)
  900. goto out_dput;
  901. }
  902. err = ovl_do_rename(old_upperdir->d_inode, olddentry,
  903. new_upperdir->d_inode, newdentry, flags);
  904. if (err)
  905. goto out_dput;
  906. if (cleanup_whiteout)
  907. ovl_cleanup(old_upperdir->d_inode, newdentry);
  908. if (overwrite && d_inode(new)) {
  909. if (new_is_dir)
  910. clear_nlink(d_inode(new));
  911. else
  912. drop_nlink(d_inode(new));
  913. }
  914. ovl_dentry_version_inc(old->d_parent, ovl_type_origin(old) ||
  915. (!overwrite && ovl_type_origin(new)));
  916. ovl_dentry_version_inc(new->d_parent, ovl_type_origin(old) ||
  917. (d_inode(new) && ovl_type_origin(new)));
  918. out_dput:
  919. dput(newdentry);
  920. out_dput_old:
  921. dput(olddentry);
  922. out_unlock:
  923. unlock_rename(new_upperdir, old_upperdir);
  924. out_revert_creds:
  925. revert_creds(old_cred);
  926. ovl_nlink_end(new, locked);
  927. out_drop_write:
  928. ovl_drop_write(old);
  929. out:
  930. dput(opaquedir);
  931. ovl_cache_free(&list);
  932. return err;
  933. }
  934. const struct inode_operations ovl_dir_inode_operations = {
  935. .lookup = ovl_lookup,
  936. .mkdir = ovl_mkdir,
  937. .symlink = ovl_symlink,
  938. .unlink = ovl_unlink,
  939. .rmdir = ovl_rmdir,
  940. .rename = ovl_rename,
  941. .link = ovl_link,
  942. .setattr = ovl_setattr,
  943. .create = ovl_create,
  944. .mknod = ovl_mknod,
  945. .permission = ovl_permission,
  946. .getattr = ovl_getattr,
  947. .listxattr = ovl_listxattr,
  948. .get_acl = ovl_get_acl,
  949. .update_time = ovl_update_time,
  950. };