1
2
3
4
5
6
7
8
9
10#include <linux/capability.h>
11#include <linux/audit.h>
12#include <linux/module.h>
13#include <linux/init.h>
14#include <linux/kernel.h>
15#include <linux/security.h>
16#include <linux/file.h>
17#include <linux/mm.h>
18#include <linux/mman.h>
19#include <linux/pagemap.h>
20#include <linux/swap.h>
21#include <linux/skbuff.h>
22#include <linux/netlink.h>
23#include <linux/ptrace.h>
24#include <linux/xattr.h>
25#include <linux/hugetlb.h>
26#include <linux/mount.h>
27#include <linux/sched.h>
28#include <linux/prctl.h>
29#include <linux/securebits.h>
30#include <linux/user_namespace.h>
31
32
33
34
35
36
37
38
39
40
41
42
43static void warn_setuid_and_fcaps_mixed(const char *fname)
44{
45 static int warned;
46 if (!warned) {
47 printk(KERN_INFO "warning: `%s' has both setuid-root and"
48 " effective capabilities. Therefore not raising all"
49 " capabilities.\n", fname);
50 warned = 1;
51 }
52}
53
54int cap_netlink_send(struct sock *sk, struct sk_buff *skb)
55{
56 return 0;
57}
58
59int cap_netlink_recv(struct sk_buff *skb, int cap)
60{
61 if (!cap_raised(current_cap(), cap))
62 return -EPERM;
63 return 0;
64}
65EXPORT_SYMBOL(cap_netlink_recv);
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83int cap_capable(struct task_struct *tsk, const struct cred *cred,
84 struct user_namespace *targ_ns, int cap, int audit)
85{
86 for (;;) {
87
88 if (targ_ns != &init_user_ns && targ_ns->creator == cred->user)
89 return 0;
90
91
92 if (targ_ns == cred->user->user_ns)
93 return cap_raised(cred->cap_effective, cap) ? 0 : -EPERM;
94
95
96 if (targ_ns == &init_user_ns)
97 return -EPERM;
98
99
100
101
102
103 targ_ns = targ_ns->creator->user_ns;
104 }
105
106
107}
108
109
110
111
112
113
114
115
116
117int cap_settime(const struct timespec *ts, const struct timezone *tz)
118{
119 if (!capable(CAP_SYS_TIME))
120 return -EPERM;
121 return 0;
122}
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139int cap_ptrace_access_check(struct task_struct *child, unsigned int mode)
140{
141 int ret = 0;
142 const struct cred *cred, *child_cred;
143
144 rcu_read_lock();
145 cred = current_cred();
146 child_cred = __task_cred(child);
147 if (cred->user->user_ns == child_cred->user->user_ns &&
148 cap_issubset(child_cred->cap_permitted, cred->cap_permitted))
149 goto out;
150 if (ns_capable(child_cred->user->user_ns, CAP_SYS_PTRACE))
151 goto out;
152 ret = -EPERM;
153out:
154 rcu_read_unlock();
155 return ret;
156}
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171int cap_ptrace_traceme(struct task_struct *parent)
172{
173 int ret = 0;
174 const struct cred *cred, *child_cred;
175
176 rcu_read_lock();
177 cred = __task_cred(parent);
178 child_cred = current_cred();
179 if (cred->user->user_ns == child_cred->user->user_ns &&
180 cap_issubset(child_cred->cap_permitted, cred->cap_permitted))
181 goto out;
182 if (has_ns_capability(parent, child_cred->user->user_ns, CAP_SYS_PTRACE))
183 goto out;
184 ret = -EPERM;
185out:
186 rcu_read_unlock();
187 return ret;
188}
189
190
191
192
193
194
195
196
197
198
199
200int cap_capget(struct task_struct *target, kernel_cap_t *effective,
201 kernel_cap_t *inheritable, kernel_cap_t *permitted)
202{
203 const struct cred *cred;
204
205
206 rcu_read_lock();
207 cred = __task_cred(target);
208 *effective = cred->cap_effective;
209 *inheritable = cred->cap_inheritable;
210 *permitted = cred->cap_permitted;
211 rcu_read_unlock();
212 return 0;
213}
214
215
216
217
218
219static inline int cap_inh_is_capped(void)
220{
221
222
223
224
225 if (cap_capable(current, current_cred(),
226 current_cred()->user->user_ns, CAP_SETPCAP,
227 SECURITY_CAP_AUDIT) == 0)
228 return 0;
229 return 1;
230}
231
232
233
234
235
236
237
238
239
240
241
242
243
244int cap_capset(struct cred *new,
245 const struct cred *old,
246 const kernel_cap_t *effective,
247 const kernel_cap_t *inheritable,
248 const kernel_cap_t *permitted)
249{
250 if (cap_inh_is_capped() &&
251 !cap_issubset(*inheritable,
252 cap_combine(old->cap_inheritable,
253 old->cap_permitted)))
254
255 return -EPERM;
256
257 if (!cap_issubset(*inheritable,
258 cap_combine(old->cap_inheritable,
259 old->cap_bset)))
260
261 return -EPERM;
262
263
264 if (!cap_issubset(*permitted, old->cap_permitted))
265 return -EPERM;
266
267
268 if (!cap_issubset(*effective, *permitted))
269 return -EPERM;
270
271 new->cap_effective = *effective;
272 new->cap_inheritable = *inheritable;
273 new->cap_permitted = *permitted;
274 return 0;
275}
276
277
278
279
280static inline void bprm_clear_caps(struct linux_binprm *bprm)
281{
282 cap_clear(bprm->cred->cap_permitted);
283 bprm->cap_effective = false;
284}
285
286
287
288
289
290
291
292
293
294
295
296
297int cap_inode_need_killpriv(struct dentry *dentry)
298{
299 struct inode *inode = dentry->d_inode;
300 int error;
301
302 if (!inode->i_op->getxattr)
303 return 0;
304
305 error = inode->i_op->getxattr(dentry, XATTR_NAME_CAPS, NULL, 0);
306 if (error <= 0)
307 return 0;
308 return 1;
309}
310
311
312
313
314
315
316
317
318
319int cap_inode_killpriv(struct dentry *dentry)
320{
321 struct inode *inode = dentry->d_inode;
322
323 if (!inode->i_op->removexattr)
324 return 0;
325
326 return inode->i_op->removexattr(dentry, XATTR_NAME_CAPS);
327}
328
329
330
331
332
333static inline int bprm_caps_from_vfs_caps(struct cpu_vfs_cap_data *caps,
334 struct linux_binprm *bprm,
335 bool *effective)
336{
337 struct cred *new = bprm->cred;
338 unsigned i;
339 int ret = 0;
340
341 if (caps->magic_etc & VFS_CAP_FLAGS_EFFECTIVE)
342 *effective = true;
343
344 CAP_FOR_EACH_U32(i) {
345 __u32 permitted = caps->permitted.cap[i];
346 __u32 inheritable = caps->inheritable.cap[i];
347
348
349
350
351 new->cap_permitted.cap[i] =
352 (new->cap_bset.cap[i] & permitted) |
353 (new->cap_inheritable.cap[i] & inheritable);
354
355 if (permitted & ~new->cap_permitted.cap[i])
356
357 ret = -EPERM;
358 }
359
360
361
362
363
364
365 return *effective ? ret : 0;
366}
367
368
369
370
371int get_vfs_caps_from_disk(const struct dentry *dentry, struct cpu_vfs_cap_data *cpu_caps)
372{
373 struct inode *inode = dentry->d_inode;
374 __u32 magic_etc;
375 unsigned tocopy, i;
376 int size;
377 struct vfs_cap_data caps;
378
379 memset(cpu_caps, 0, sizeof(struct cpu_vfs_cap_data));
380
381 if (!inode || !inode->i_op->getxattr)
382 return -ENODATA;
383
384 size = inode->i_op->getxattr((struct dentry *)dentry, XATTR_NAME_CAPS, &caps,
385 XATTR_CAPS_SZ);
386 if (size == -ENODATA || size == -EOPNOTSUPP)
387
388 return -ENODATA;
389 if (size < 0)
390 return size;
391
392 if (size < sizeof(magic_etc))
393 return -EINVAL;
394
395 cpu_caps->magic_etc = magic_etc = le32_to_cpu(caps.magic_etc);
396
397 switch (magic_etc & VFS_CAP_REVISION_MASK) {
398 case VFS_CAP_REVISION_1:
399 if (size != XATTR_CAPS_SZ_1)
400 return -EINVAL;
401 tocopy = VFS_CAP_U32_1;
402 break;
403 case VFS_CAP_REVISION_2:
404 if (size != XATTR_CAPS_SZ_2)
405 return -EINVAL;
406 tocopy = VFS_CAP_U32_2;
407 break;
408 default:
409 return -EINVAL;
410 }
411
412 CAP_FOR_EACH_U32(i) {
413 if (i >= tocopy)
414 break;
415 cpu_caps->permitted.cap[i] = le32_to_cpu(caps.data[i].permitted);
416 cpu_caps->inheritable.cap[i] = le32_to_cpu(caps.data[i].inheritable);
417 }
418
419 return 0;
420}
421
422
423
424
425
426
427static int get_file_caps(struct linux_binprm *bprm, bool *effective)
428{
429 struct dentry *dentry;
430 int rc = 0;
431 struct cpu_vfs_cap_data vcaps;
432
433 bprm_clear_caps(bprm);
434
435 if (!file_caps_enabled)
436 return 0;
437
438 if (bprm->file->f_vfsmnt->mnt_flags & MNT_NOSUID)
439 return 0;
440
441 dentry = dget(bprm->file->f_dentry);
442
443 rc = get_vfs_caps_from_disk(dentry, &vcaps);
444 if (rc < 0) {
445 if (rc == -EINVAL)
446 printk(KERN_NOTICE "%s: get_vfs_caps_from_disk returned %d for %s\n",
447 __func__, rc, bprm->filename);
448 else if (rc == -ENODATA)
449 rc = 0;
450 goto out;
451 }
452
453 rc = bprm_caps_from_vfs_caps(&vcaps, bprm, effective);
454 if (rc == -EINVAL)
455 printk(KERN_NOTICE "%s: cap_from_disk returned %d for %s\n",
456 __func__, rc, bprm->filename);
457
458out:
459 dput(dentry);
460 if (rc)
461 bprm_clear_caps(bprm);
462
463 return rc;
464}
465
466
467
468
469
470
471
472
473
474int cap_bprm_set_creds(struct linux_binprm *bprm)
475{
476 const struct cred *old = current_cred();
477 struct cred *new = bprm->cred;
478 bool effective;
479 int ret;
480
481 effective = false;
482 ret = get_file_caps(bprm, &effective);
483 if (ret < 0)
484 return ret;
485
486 if (!issecure(SECURE_NOROOT)) {
487
488
489
490
491
492 if (effective && new->uid != 0 && new->euid == 0) {
493 warn_setuid_and_fcaps_mixed(bprm->filename);
494 goto skip;
495 }
496
497
498
499
500
501
502
503 if (new->euid == 0 || new->uid == 0) {
504
505 new->cap_permitted = cap_combine(old->cap_bset,
506 old->cap_inheritable);
507 }
508 if (new->euid == 0)
509 effective = true;
510 }
511skip:
512
513
514
515
516 if ((new->euid != old->uid ||
517 new->egid != old->gid ||
518 !cap_issubset(new->cap_permitted, old->cap_permitted)) &&
519 bprm->unsafe & ~LSM_UNSAFE_PTRACE_CAP) {
520
521 if (!capable(CAP_SETUID)) {
522 new->euid = new->uid;
523 new->egid = new->gid;
524 }
525 new->cap_permitted = cap_intersect(new->cap_permitted,
526 old->cap_permitted);
527 }
528
529 new->suid = new->fsuid = new->euid;
530 new->sgid = new->fsgid = new->egid;
531
532 if (effective)
533 new->cap_effective = new->cap_permitted;
534 else
535 cap_clear(new->cap_effective);
536 bprm->cap_effective = effective;
537
538
539
540
541
542
543
544
545
546
547
548
549
550 if (!cap_isclear(new->cap_effective)) {
551 if (!cap_issubset(CAP_FULL_SET, new->cap_effective) ||
552 new->euid != 0 || new->uid != 0 ||
553 issecure(SECURE_NOROOT)) {
554 ret = audit_log_bprm_fcaps(bprm, new, old);
555 if (ret < 0)
556 return ret;
557 }
558 }
559
560 new->securebits &= ~issecure_mask(SECURE_KEEP_CAPS);
561 return 0;
562}
563
564
565
566
567
568
569
570
571
572
573
574int cap_bprm_secureexec(struct linux_binprm *bprm)
575{
576 const struct cred *cred = current_cred();
577
578 if (cred->uid != 0) {
579 if (bprm->cap_effective)
580 return 1;
581 if (!cap_isclear(cred->cap_permitted))
582 return 1;
583 }
584
585 return (cred->euid != cred->uid ||
586 cred->egid != cred->gid);
587}
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603int cap_inode_setxattr(struct dentry *dentry, const char *name,
604 const void *value, size_t size, int flags)
605{
606 if (!strcmp(name, XATTR_NAME_CAPS)) {
607 if (!capable(CAP_SETFCAP))
608 return -EPERM;
609 return 0;
610 }
611
612 if (!strncmp(name, XATTR_SECURITY_PREFIX,
613 sizeof(XATTR_SECURITY_PREFIX) - 1) &&
614 !capable(CAP_SYS_ADMIN))
615 return -EPERM;
616 return 0;
617}
618
619
620
621
622
623
624
625
626
627
628
629
630int cap_inode_removexattr(struct dentry *dentry, const char *name)
631{
632 if (!strcmp(name, XATTR_NAME_CAPS)) {
633 if (!capable(CAP_SETFCAP))
634 return -EPERM;
635 return 0;
636 }
637
638 if (!strncmp(name, XATTR_SECURITY_PREFIX,
639 sizeof(XATTR_SECURITY_PREFIX) - 1) &&
640 !capable(CAP_SYS_ADMIN))
641 return -EPERM;
642 return 0;
643}
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674static inline void cap_emulate_setxuid(struct cred *new, const struct cred *old)
675{
676 if ((old->uid == 0 || old->euid == 0 || old->suid == 0) &&
677 (new->uid != 0 && new->euid != 0 && new->suid != 0) &&
678 !issecure(SECURE_KEEP_CAPS)) {
679 cap_clear(new->cap_permitted);
680 cap_clear(new->cap_effective);
681 }
682 if (old->euid == 0 && new->euid != 0)
683 cap_clear(new->cap_effective);
684 if (old->euid != 0 && new->euid == 0)
685 new->cap_effective = new->cap_permitted;
686}
687
688
689
690
691
692
693
694
695
696
697int cap_task_fix_setuid(struct cred *new, const struct cred *old, int flags)
698{
699 switch (flags) {
700 case LSM_SETID_RE:
701 case LSM_SETID_ID:
702 case LSM_SETID_RES:
703
704
705 if (!issecure(SECURE_NO_SETUID_FIXUP))
706 cap_emulate_setxuid(new, old);
707 break;
708
709 case LSM_SETID_FS:
710
711
712
713
714
715
716 if (!issecure(SECURE_NO_SETUID_FIXUP)) {
717 if (old->fsuid == 0 && new->fsuid != 0)
718 new->cap_effective =
719 cap_drop_fs_set(new->cap_effective);
720
721 if (old->fsuid != 0 && new->fsuid == 0)
722 new->cap_effective =
723 cap_raise_fs_set(new->cap_effective,
724 new->cap_permitted);
725 }
726 break;
727
728 default:
729 return -EINVAL;
730 }
731
732 return 0;
733}
734
735
736
737
738
739
740
741
742
743
744
745static int cap_safe_nice(struct task_struct *p)
746{
747 int is_subset;
748
749 rcu_read_lock();
750 is_subset = cap_issubset(__task_cred(p)->cap_permitted,
751 current_cred()->cap_permitted);
752 rcu_read_unlock();
753
754 if (!is_subset && !capable(CAP_SYS_NICE))
755 return -EPERM;
756 return 0;
757}
758
759
760
761
762
763
764
765
766int cap_task_setscheduler(struct task_struct *p)
767{
768 return cap_safe_nice(p);
769}
770
771
772
773
774
775
776
777
778
779int cap_task_setioprio(struct task_struct *p, int ioprio)
780{
781 return cap_safe_nice(p);
782}
783
784
785
786
787
788
789
790
791
792int cap_task_setnice(struct task_struct *p, int nice)
793{
794 return cap_safe_nice(p);
795}
796
797
798
799
800
801static long cap_prctl_drop(struct cred *new, unsigned long cap)
802{
803 if (!capable(CAP_SETPCAP))
804 return -EPERM;
805 if (!cap_valid(cap))
806 return -EINVAL;
807
808 cap_lower(new->cap_bset, cap);
809 return 0;
810}
811
812
813
814
815
816
817
818
819
820
821
822
823
824int cap_task_prctl(int option, unsigned long arg2, unsigned long arg3,
825 unsigned long arg4, unsigned long arg5)
826{
827 struct cred *new;
828 long error = 0;
829
830 new = prepare_creds();
831 if (!new)
832 return -ENOMEM;
833
834 switch (option) {
835 case PR_CAPBSET_READ:
836 error = -EINVAL;
837 if (!cap_valid(arg2))
838 goto error;
839 error = !!cap_raised(new->cap_bset, arg2);
840 goto no_change;
841
842 case PR_CAPBSET_DROP:
843 error = cap_prctl_drop(new, arg2);
844 if (error < 0)
845 goto error;
846 goto changed;
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867 case PR_SET_SECUREBITS:
868 error = -EPERM;
869 if ((((new->securebits & SECURE_ALL_LOCKS) >> 1)
870 & (new->securebits ^ arg2))
871 || ((new->securebits & SECURE_ALL_LOCKS & ~arg2))
872 || (arg2 & ~(SECURE_ALL_LOCKS | SECURE_ALL_BITS))
873 || (cap_capable(current, current_cred(),
874 current_cred()->user->user_ns, CAP_SETPCAP,
875 SECURITY_CAP_AUDIT) != 0)
876
877
878
879
880
881
882
883 )
884
885 goto error;
886 new->securebits = arg2;
887 goto changed;
888
889 case PR_GET_SECUREBITS:
890 error = new->securebits;
891 goto no_change;
892
893 case PR_GET_KEEPCAPS:
894 if (issecure(SECURE_KEEP_CAPS))
895 error = 1;
896 goto no_change;
897
898 case PR_SET_KEEPCAPS:
899 error = -EINVAL;
900 if (arg2 > 1)
901 goto error;
902 error = -EPERM;
903 if (issecure(SECURE_KEEP_CAPS_LOCKED))
904 goto error;
905 if (arg2)
906 new->securebits |= issecure_mask(SECURE_KEEP_CAPS);
907 else
908 new->securebits &= ~issecure_mask(SECURE_KEEP_CAPS);
909 goto changed;
910
911 default:
912
913 error = -ENOSYS;
914 goto error;
915 }
916
917
918changed:
919 return commit_creds(new);
920
921no_change:
922error:
923 abort_creds(new);
924 return error;
925}
926
927
928
929
930
931
932
933
934
935int cap_vm_enough_memory(struct mm_struct *mm, long pages)
936{
937 int cap_sys_admin = 0;
938
939 if (cap_capable(current, current_cred(), &init_user_ns, CAP_SYS_ADMIN,
940 SECURITY_CAP_NOAUDIT) == 0)
941 cap_sys_admin = 1;
942 return __vm_enough_memory(mm, pages, cap_sys_admin);
943}
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959int cap_file_mmap(struct file *file, unsigned long reqprot,
960 unsigned long prot, unsigned long flags,
961 unsigned long addr, unsigned long addr_only)
962{
963 int ret = 0;
964
965 if (addr < dac_mmap_min_addr) {
966 ret = cap_capable(current, current_cred(), &init_user_ns, CAP_SYS_RAWIO,
967 SECURITY_CAP_AUDIT);
968
969 if (ret == 0)
970 current->flags |= PF_SUPERPRIV;
971 }
972 return ret;
973}
974