1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22#include <linux/kernel_stat.h>
23#include <linux/module.h>
24#include <linux/interrupt.h>
25#include <linux/percpu.h>
26#include <linux/init.h>
27#include <linux/mm.h>
28#include <linux/swap.h>
29#include <linux/pid_namespace.h>
30#include <linux/notifier.h>
31#include <linux/thread_info.h>
32#include <linux/time.h>
33#include <linux/jiffies.h>
34#include <linux/posix-timers.h>
35#include <linux/cpu.h>
36#include <linux/syscalls.h>
37#include <linux/delay.h>
38#include <linux/tick.h>
39#include <linux/kallsyms.h>
40#include <linux/perf_event.h>
41#include <linux/sched.h>
42#include <linux/slab.h>
43
44#include <asm/uaccess.h>
45#include <asm/unistd.h>
46#include <asm/div64.h>
47#include <asm/timex.h>
48#include <asm/io.h>
49
50#define CREATE_TRACE_POINTS
51#include <trace/events/timer.h>
52
53u64 jiffies_64 __cacheline_aligned_in_smp = INITIAL_JIFFIES;
54
55EXPORT_SYMBOL(jiffies_64);
56
57
58
59
60#define TVN_BITS (CONFIG_BASE_SMALL ? 4 : 6)
61#define TVR_BITS (CONFIG_BASE_SMALL ? 6 : 8)
62#define TVN_SIZE (1 << TVN_BITS)
63#define TVR_SIZE (1 << TVR_BITS)
64#define TVN_MASK (TVN_SIZE - 1)
65#define TVR_MASK (TVR_SIZE - 1)
66
67struct tvec {
68 struct list_head vec[TVN_SIZE];
69};
70
71struct tvec_root {
72 struct list_head vec[TVR_SIZE];
73};
74
75struct tvec_base {
76 spinlock_t lock;
77 struct timer_list *running_timer;
78 unsigned long timer_jiffies;
79 unsigned long next_timer;
80 struct tvec_root tv1;
81 struct tvec tv2;
82 struct tvec tv3;
83 struct tvec tv4;
84 struct tvec tv5;
85} ____cacheline_aligned;
86
87struct tvec_base boot_tvec_bases;
88EXPORT_SYMBOL(boot_tvec_bases);
89static DEFINE_PER_CPU(struct tvec_base *, tvec_bases) = &boot_tvec_bases;
90
91
92
93
94
95
96#define TBASE_DEFERRABLE_FLAG (0x1)
97
98
99static inline unsigned int tbase_get_deferrable(struct tvec_base *base)
100{
101 return ((unsigned int)(unsigned long)base & TBASE_DEFERRABLE_FLAG);
102}
103
104static inline struct tvec_base *tbase_get_base(struct tvec_base *base)
105{
106 return ((struct tvec_base *)((unsigned long)base & ~TBASE_DEFERRABLE_FLAG));
107}
108
109static inline void timer_set_deferrable(struct timer_list *timer)
110{
111 timer->base = ((struct tvec_base *)((unsigned long)(timer->base) |
112 TBASE_DEFERRABLE_FLAG));
113}
114
115static inline void
116timer_set_base(struct timer_list *timer, struct tvec_base *new_base)
117{
118 timer->base = (struct tvec_base *)((unsigned long)(new_base) |
119 tbase_get_deferrable(timer->base));
120}
121
122static unsigned long round_jiffies_common(unsigned long j, int cpu,
123 bool force_up)
124{
125 int rem;
126 unsigned long original = j;
127
128
129
130
131
132
133
134
135
136 j += cpu * 3;
137
138 rem = j % HZ;
139
140
141
142
143
144
145
146
147 if (rem < HZ/4 && !force_up)
148 j = j - rem;
149 else
150 j = j - rem + HZ;
151
152
153 j -= cpu * 3;
154
155 if (j <= jiffies)
156 return original;
157 return j;
158}
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180unsigned long __round_jiffies(unsigned long j, int cpu)
181{
182 return round_jiffies_common(j, cpu, false);
183}
184EXPORT_SYMBOL_GPL(__round_jiffies);
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206unsigned long __round_jiffies_relative(unsigned long j, int cpu)
207{
208 unsigned long j0 = jiffies;
209
210
211 return round_jiffies_common(j + j0, cpu, false) - j0;
212}
213EXPORT_SYMBOL_GPL(__round_jiffies_relative);
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230unsigned long round_jiffies(unsigned long j)
231{
232 return round_jiffies_common(j, raw_smp_processor_id(), false);
233}
234EXPORT_SYMBOL_GPL(round_jiffies);
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251unsigned long round_jiffies_relative(unsigned long j)
252{
253 return __round_jiffies_relative(j, raw_smp_processor_id());
254}
255EXPORT_SYMBOL_GPL(round_jiffies_relative);
256
257
258
259
260
261
262
263
264
265
266
267unsigned long __round_jiffies_up(unsigned long j, int cpu)
268{
269 return round_jiffies_common(j, cpu, true);
270}
271EXPORT_SYMBOL_GPL(__round_jiffies_up);
272
273
274
275
276
277
278
279
280
281
282
283unsigned long __round_jiffies_up_relative(unsigned long j, int cpu)
284{
285 unsigned long j0 = jiffies;
286
287
288 return round_jiffies_common(j + j0, cpu, true) - j0;
289}
290EXPORT_SYMBOL_GPL(__round_jiffies_up_relative);
291
292
293
294
295
296
297
298
299
300
301unsigned long round_jiffies_up(unsigned long j)
302{
303 return round_jiffies_common(j, raw_smp_processor_id(), true);
304}
305EXPORT_SYMBOL_GPL(round_jiffies_up);
306
307
308
309
310
311
312
313
314
315
316unsigned long round_jiffies_up_relative(unsigned long j)
317{
318 return __round_jiffies_up_relative(j, raw_smp_processor_id());
319}
320EXPORT_SYMBOL_GPL(round_jiffies_up_relative);
321
322
323static inline void set_running_timer(struct tvec_base *base,
324 struct timer_list *timer)
325{
326#ifdef CONFIG_SMP
327 base->running_timer = timer;
328#endif
329}
330
331static void internal_add_timer(struct tvec_base *base, struct timer_list *timer)
332{
333 unsigned long expires = timer->expires;
334 unsigned long idx = expires - base->timer_jiffies;
335 struct list_head *vec;
336
337 if (idx < TVR_SIZE) {
338 int i = expires & TVR_MASK;
339 vec = base->tv1.vec + i;
340 } else if (idx < 1 << (TVR_BITS + TVN_BITS)) {
341 int i = (expires >> TVR_BITS) & TVN_MASK;
342 vec = base->tv2.vec + i;
343 } else if (idx < 1 << (TVR_BITS + 2 * TVN_BITS)) {
344 int i = (expires >> (TVR_BITS + TVN_BITS)) & TVN_MASK;
345 vec = base->tv3.vec + i;
346 } else if (idx < 1 << (TVR_BITS + 3 * TVN_BITS)) {
347 int i = (expires >> (TVR_BITS + 2 * TVN_BITS)) & TVN_MASK;
348 vec = base->tv4.vec + i;
349 } else if ((signed long) idx < 0) {
350
351
352
353
354 vec = base->tv1.vec + (base->timer_jiffies & TVR_MASK);
355 } else {
356 int i;
357
358
359
360 if (idx > 0xffffffffUL) {
361 idx = 0xffffffffUL;
362 expires = idx + base->timer_jiffies;
363 }
364 i = (expires >> (TVR_BITS + 3 * TVN_BITS)) & TVN_MASK;
365 vec = base->tv5.vec + i;
366 }
367
368
369
370 list_add_tail(&timer->entry, vec);
371}
372
373#ifdef CONFIG_TIMER_STATS
374void __timer_stats_timer_set_start_info(struct timer_list *timer, void *addr)
375{
376 if (timer->start_site)
377 return;
378
379 timer->start_site = addr;
380 memcpy(timer->start_comm, current->comm, TASK_COMM_LEN);
381 timer->start_pid = current->pid;
382}
383
384static void timer_stats_account_timer(struct timer_list *timer)
385{
386 unsigned int flag = 0;
387
388 if (likely(!timer->start_site))
389 return;
390 if (unlikely(tbase_get_deferrable(timer->base)))
391 flag |= TIMER_STATS_FLAG_DEFERRABLE;
392
393 timer_stats_update_stats(timer, timer->start_pid, timer->start_site,
394 timer->function, timer->start_comm, flag);
395}
396
397#else
398static void timer_stats_account_timer(struct timer_list *timer) {}
399#endif
400
401#ifdef CONFIG_DEBUG_OBJECTS_TIMERS
402
403static struct debug_obj_descr timer_debug_descr;
404
405
406
407
408
409static int timer_fixup_init(void *addr, enum debug_obj_state state)
410{
411 struct timer_list *timer = addr;
412
413 switch (state) {
414 case ODEBUG_STATE_ACTIVE:
415 del_timer_sync(timer);
416 debug_object_init(timer, &timer_debug_descr);
417 return 1;
418 default:
419 return 0;
420 }
421}
422
423
424
425
426
427
428static int timer_fixup_activate(void *addr, enum debug_obj_state state)
429{
430 struct timer_list *timer = addr;
431
432 switch (state) {
433
434 case ODEBUG_STATE_NOTAVAILABLE:
435
436
437
438
439
440 if (timer->entry.next == NULL &&
441 timer->entry.prev == TIMER_ENTRY_STATIC) {
442 debug_object_init(timer, &timer_debug_descr);
443 debug_object_activate(timer, &timer_debug_descr);
444 return 0;
445 } else {
446 WARN_ON_ONCE(1);
447 }
448 return 0;
449
450 case ODEBUG_STATE_ACTIVE:
451 WARN_ON(1);
452
453 default:
454 return 0;
455 }
456}
457
458
459
460
461
462static int timer_fixup_free(void *addr, enum debug_obj_state state)
463{
464 struct timer_list *timer = addr;
465
466 switch (state) {
467 case ODEBUG_STATE_ACTIVE:
468 del_timer_sync(timer);
469 debug_object_free(timer, &timer_debug_descr);
470 return 1;
471 default:
472 return 0;
473 }
474}
475
476static struct debug_obj_descr timer_debug_descr = {
477 .name = "timer_list",
478 .fixup_init = timer_fixup_init,
479 .fixup_activate = timer_fixup_activate,
480 .fixup_free = timer_fixup_free,
481};
482
483static inline void debug_timer_init(struct timer_list *timer)
484{
485 debug_object_init(timer, &timer_debug_descr);
486}
487
488static inline void debug_timer_activate(struct timer_list *timer)
489{
490 debug_object_activate(timer, &timer_debug_descr);
491}
492
493static inline void debug_timer_deactivate(struct timer_list *timer)
494{
495 debug_object_deactivate(timer, &timer_debug_descr);
496}
497
498static inline void debug_timer_free(struct timer_list *timer)
499{
500 debug_object_free(timer, &timer_debug_descr);
501}
502
503static void __init_timer(struct timer_list *timer,
504 const char *name,
505 struct lock_class_key *key);
506
507void init_timer_on_stack_key(struct timer_list *timer,
508 const char *name,
509 struct lock_class_key *key)
510{
511 debug_object_init_on_stack(timer, &timer_debug_descr);
512 __init_timer(timer, name, key);
513}
514EXPORT_SYMBOL_GPL(init_timer_on_stack_key);
515
516void destroy_timer_on_stack(struct timer_list *timer)
517{
518 debug_object_free(timer, &timer_debug_descr);
519}
520EXPORT_SYMBOL_GPL(destroy_timer_on_stack);
521
522#else
523static inline void debug_timer_init(struct timer_list *timer) { }
524static inline void debug_timer_activate(struct timer_list *timer) { }
525static inline void debug_timer_deactivate(struct timer_list *timer) { }
526#endif
527
528static inline void debug_init(struct timer_list *timer)
529{
530 debug_timer_init(timer);
531 trace_timer_init(timer);
532}
533
534static inline void
535debug_activate(struct timer_list *timer, unsigned long expires)
536{
537 debug_timer_activate(timer);
538 trace_timer_start(timer, expires);
539}
540
541static inline void debug_deactivate(struct timer_list *timer)
542{
543 debug_timer_deactivate(timer);
544 trace_timer_cancel(timer);
545}
546
547static void __init_timer(struct timer_list *timer,
548 const char *name,
549 struct lock_class_key *key)
550{
551 timer->entry.next = NULL;
552 timer->base = __raw_get_cpu_var(tvec_bases);
553#ifdef CONFIG_TIMER_STATS
554 timer->start_site = NULL;
555 timer->start_pid = -1;
556 memset(timer->start_comm, 0, TASK_COMM_LEN);
557#endif
558 lockdep_init_map(&timer->lockdep_map, name, key, 0);
559}
560
561
562
563
564
565
566
567
568
569
570
571void init_timer_key(struct timer_list *timer,
572 const char *name,
573 struct lock_class_key *key)
574{
575 debug_init(timer);
576 __init_timer(timer, name, key);
577}
578EXPORT_SYMBOL(init_timer_key);
579
580void init_timer_deferrable_key(struct timer_list *timer,
581 const char *name,
582 struct lock_class_key *key)
583{
584 init_timer_key(timer, name, key);
585 timer_set_deferrable(timer);
586}
587EXPORT_SYMBOL(init_timer_deferrable_key);
588
589static inline void detach_timer(struct timer_list *timer,
590 int clear_pending)
591{
592 struct list_head *entry = &timer->entry;
593
594 debug_deactivate(timer);
595
596 __list_del(entry->prev, entry->next);
597 if (clear_pending)
598 entry->next = NULL;
599 entry->prev = LIST_POISON2;
600}
601
602
603
604
605
606
607
608
609
610
611
612
613
614static struct tvec_base *lock_timer_base(struct timer_list *timer,
615 unsigned long *flags)
616 __acquires(timer->base->lock)
617{
618 struct tvec_base *base;
619
620 for (;;) {
621 struct tvec_base *prelock_base = timer->base;
622 base = tbase_get_base(prelock_base);
623 if (likely(base != NULL)) {
624 spin_lock_irqsave(&base->lock, *flags);
625 if (likely(prelock_base == timer->base))
626 return base;
627
628 spin_unlock_irqrestore(&base->lock, *flags);
629 }
630 cpu_relax();
631 }
632}
633
634static inline int
635__mod_timer(struct timer_list *timer, unsigned long expires,
636 bool pending_only, int pinned)
637{
638 struct tvec_base *base, *new_base;
639 unsigned long flags;
640 int ret = 0 , cpu;
641
642 timer_stats_timer_set_start_info(timer);
643 BUG_ON(!timer->function);
644
645 base = lock_timer_base(timer, &flags);
646
647 if (timer_pending(timer)) {
648 detach_timer(timer, 0);
649 if (timer->expires == base->next_timer &&
650 !tbase_get_deferrable(timer->base))
651 base->next_timer = base->timer_jiffies;
652 ret = 1;
653 } else {
654 if (pending_only)
655 goto out_unlock;
656 }
657
658 debug_activate(timer, expires);
659
660 cpu = smp_processor_id();
661
662#if defined(CONFIG_NO_HZ) && defined(CONFIG_SMP)
663 if (!pinned && get_sysctl_timer_migration() && idle_cpu(cpu)) {
664 int preferred_cpu = get_nohz_load_balancer();
665
666 if (preferred_cpu >= 0)
667 cpu = preferred_cpu;
668 }
669#endif
670 new_base = per_cpu(tvec_bases, cpu);
671
672 if (base != new_base) {
673
674
675
676
677
678
679
680 if (likely(base->running_timer != timer)) {
681
682 timer_set_base(timer, NULL);
683 spin_unlock(&base->lock);
684 base = new_base;
685 spin_lock(&base->lock);
686 timer_set_base(timer, base);
687 }
688 }
689
690 timer->expires = expires;
691 if (time_before(timer->expires, base->next_timer) &&
692 !tbase_get_deferrable(timer->base))
693 base->next_timer = timer->expires;
694 internal_add_timer(base, timer);
695
696out_unlock:
697 spin_unlock_irqrestore(&base->lock, flags);
698
699 return ret;
700}
701
702
703
704
705
706
707
708
709
710
711
712int mod_timer_pending(struct timer_list *timer, unsigned long expires)
713{
714 return __mod_timer(timer, expires, true, TIMER_NOT_PINNED);
715}
716EXPORT_SYMBOL(mod_timer_pending);
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738int mod_timer(struct timer_list *timer, unsigned long expires)
739{
740
741
742
743
744
745 if (timer_pending(timer) && timer->expires == expires)
746 return 1;
747
748 return __mod_timer(timer, expires, false, TIMER_NOT_PINNED);
749}
750EXPORT_SYMBOL(mod_timer);
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765int mod_timer_pinned(struct timer_list *timer, unsigned long expires)
766{
767 if (timer->expires == expires && timer_pending(timer))
768 return 1;
769
770 return __mod_timer(timer, expires, false, TIMER_PINNED);
771}
772EXPORT_SYMBOL(mod_timer_pinned);
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788void add_timer(struct timer_list *timer)
789{
790 BUG_ON(timer_pending(timer));
791 mod_timer(timer, timer->expires);
792}
793EXPORT_SYMBOL(add_timer);
794
795
796
797
798
799
800
801
802void add_timer_on(struct timer_list *timer, int cpu)
803{
804 struct tvec_base *base = per_cpu(tvec_bases, cpu);
805 unsigned long flags;
806
807 timer_stats_timer_set_start_info(timer);
808 BUG_ON(timer_pending(timer) || !timer->function);
809 spin_lock_irqsave(&base->lock, flags);
810 timer_set_base(timer, base);
811 debug_activate(timer, timer->expires);
812 if (time_before(timer->expires, base->next_timer) &&
813 !tbase_get_deferrable(timer->base))
814 base->next_timer = timer->expires;
815 internal_add_timer(base, timer);
816
817
818
819
820
821
822
823
824 wake_up_idle_cpu(cpu);
825 spin_unlock_irqrestore(&base->lock, flags);
826}
827EXPORT_SYMBOL_GPL(add_timer_on);
828
829
830
831
832
833
834
835
836
837
838
839
840int del_timer(struct timer_list *timer)
841{
842 struct tvec_base *base;
843 unsigned long flags;
844 int ret = 0;
845
846 timer_stats_timer_clear_start_info(timer);
847 if (timer_pending(timer)) {
848 base = lock_timer_base(timer, &flags);
849 if (timer_pending(timer)) {
850 detach_timer(timer, 1);
851 if (timer->expires == base->next_timer &&
852 !tbase_get_deferrable(timer->base))
853 base->next_timer = base->timer_jiffies;
854 ret = 1;
855 }
856 spin_unlock_irqrestore(&base->lock, flags);
857 }
858
859 return ret;
860}
861EXPORT_SYMBOL(del_timer);
862
863#ifdef CONFIG_SMP
864
865
866
867
868
869
870
871
872
873int try_to_del_timer_sync(struct timer_list *timer)
874{
875 struct tvec_base *base;
876 unsigned long flags;
877 int ret = -1;
878
879 base = lock_timer_base(timer, &flags);
880
881 if (base->running_timer == timer)
882 goto out;
883
884 timer_stats_timer_clear_start_info(timer);
885 ret = 0;
886 if (timer_pending(timer)) {
887 detach_timer(timer, 1);
888 if (timer->expires == base->next_timer &&
889 !tbase_get_deferrable(timer->base))
890 base->next_timer = base->timer_jiffies;
891 ret = 1;
892 }
893out:
894 spin_unlock_irqrestore(&base->lock, flags);
895
896 return ret;
897}
898EXPORT_SYMBOL(try_to_del_timer_sync);
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917int del_timer_sync(struct timer_list *timer)
918{
919#ifdef CONFIG_LOCKDEP
920 unsigned long flags;
921
922 local_irq_save(flags);
923 lock_map_acquire(&timer->lockdep_map);
924 lock_map_release(&timer->lockdep_map);
925 local_irq_restore(flags);
926#endif
927
928 for (;;) {
929 int ret = try_to_del_timer_sync(timer);
930 if (ret >= 0)
931 return ret;
932 cpu_relax();
933 }
934}
935EXPORT_SYMBOL(del_timer_sync);
936#endif
937
938static int cascade(struct tvec_base *base, struct tvec *tv, int index)
939{
940
941 struct timer_list *timer, *tmp;
942 struct list_head tv_list;
943
944 list_replace_init(tv->vec + index, &tv_list);
945
946
947
948
949
950 list_for_each_entry_safe(timer, tmp, &tv_list, entry) {
951 BUG_ON(tbase_get_base(timer->base) != base);
952 internal_add_timer(base, timer);
953 }
954
955 return index;
956}
957
958#define INDEX(N) ((base->timer_jiffies >> (TVR_BITS + (N) * TVN_BITS)) & TVN_MASK)
959
960
961
962
963
964
965
966
967static inline void __run_timers(struct tvec_base *base)
968{
969 struct timer_list *timer;
970
971 spin_lock_irq(&base->lock);
972 while (time_after_eq(jiffies, base->timer_jiffies)) {
973 struct list_head work_list;
974 struct list_head *head = &work_list;
975 int index = base->timer_jiffies & TVR_MASK;
976
977
978
979
980 if (!index &&
981 (!cascade(base, &base->tv2, INDEX(0))) &&
982 (!cascade(base, &base->tv3, INDEX(1))) &&
983 !cascade(base, &base->tv4, INDEX(2)))
984 cascade(base, &base->tv5, INDEX(3));
985 ++base->timer_jiffies;
986 list_replace_init(base->tv1.vec + index, &work_list);
987 while (!list_empty(head)) {
988 void (*fn)(unsigned long);
989 unsigned long data;
990
991 timer = list_first_entry(head, struct timer_list,entry);
992 fn = timer->function;
993 data = timer->data;
994
995 timer_stats_account_timer(timer);
996
997 set_running_timer(base, timer);
998 detach_timer(timer, 1);
999
1000 spin_unlock_irq(&base->lock);
1001 {
1002 int preempt_count = preempt_count();
1003
1004#ifdef CONFIG_LOCKDEP
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014 struct lockdep_map lockdep_map =
1015 timer->lockdep_map;
1016#endif
1017
1018
1019
1020
1021
1022
1023 lock_map_acquire(&lockdep_map);
1024
1025 trace_timer_expire_entry(timer);
1026 fn(data);
1027 trace_timer_expire_exit(timer);
1028
1029 lock_map_release(&lockdep_map);
1030
1031 if (preempt_count != preempt_count()) {
1032 printk(KERN_ERR "huh, entered %p "
1033 "with preempt_count %08x, exited"
1034 " with %08x?\n",
1035 fn, preempt_count,
1036 preempt_count());
1037 BUG();
1038 }
1039 }
1040 spin_lock_irq(&base->lock);
1041 }
1042 }
1043 set_running_timer(base, NULL);
1044 spin_unlock_irq(&base->lock);
1045}
1046
1047#ifdef CONFIG_NO_HZ
1048
1049
1050
1051
1052
1053static unsigned long __next_timer_interrupt(struct tvec_base *base)
1054{
1055 unsigned long timer_jiffies = base->timer_jiffies;
1056 unsigned long expires = timer_jiffies + NEXT_TIMER_MAX_DELTA;
1057 int index, slot, array, found = 0;
1058 struct timer_list *nte;
1059 struct tvec *varray[4];
1060
1061
1062 index = slot = timer_jiffies & TVR_MASK;
1063 do {
1064 list_for_each_entry(nte, base->tv1.vec + slot, entry) {
1065 if (tbase_get_deferrable(nte->base))
1066 continue;
1067
1068 found = 1;
1069 expires = nte->expires;
1070
1071 if (!index || slot < index)
1072 goto cascade;
1073 return expires;
1074 }
1075 slot = (slot + 1) & TVR_MASK;
1076 } while (slot != index);
1077
1078cascade:
1079
1080 if (index)
1081 timer_jiffies += TVR_SIZE - index;
1082 timer_jiffies >>= TVR_BITS;
1083
1084
1085 varray[0] = &base->tv2;
1086 varray[1] = &base->tv3;
1087 varray[2] = &base->tv4;
1088 varray[3] = &base->tv5;
1089
1090 for (array = 0; array < 4; array++) {
1091 struct tvec *varp = varray[array];
1092
1093 index = slot = timer_jiffies & TVN_MASK;
1094 do {
1095 list_for_each_entry(nte, varp->vec + slot, entry) {
1096 if (tbase_get_deferrable(nte->base))
1097 continue;
1098
1099 found = 1;
1100 if (time_before(nte->expires, expires))
1101 expires = nte->expires;
1102 }
1103
1104
1105
1106
1107 if (found) {
1108
1109 if (!index || slot < index)
1110 break;
1111 return expires;
1112 }
1113 slot = (slot + 1) & TVN_MASK;
1114 } while (slot != index);
1115
1116 if (index)
1117 timer_jiffies += TVN_SIZE - index;
1118 timer_jiffies >>= TVN_BITS;
1119 }
1120 return expires;
1121}
1122
1123
1124
1125
1126
1127static unsigned long cmp_next_hrtimer_event(unsigned long now,
1128 unsigned long expires)
1129{
1130 ktime_t hr_delta = hrtimer_get_next_event();
1131 struct timespec tsdelta;
1132 unsigned long delta;
1133
1134 if (hr_delta.tv64 == KTIME_MAX)
1135 return expires;
1136
1137
1138
1139
1140 if (hr_delta.tv64 <= 0)
1141 return now + 1;
1142
1143 tsdelta = ktime_to_timespec(hr_delta);
1144 delta = timespec_to_jiffies(&tsdelta);
1145
1146
1147
1148
1149
1150 if (delta > NEXT_TIMER_MAX_DELTA)
1151 delta = NEXT_TIMER_MAX_DELTA;
1152
1153
1154
1155
1156
1157
1158
1159 if (delta < 1)
1160 delta = 1;
1161 now += delta;
1162 if (time_before(now, expires))
1163 return now;
1164 return expires;
1165}
1166
1167
1168
1169
1170
1171unsigned long get_next_timer_interrupt(unsigned long now)
1172{
1173 struct tvec_base *base = __get_cpu_var(tvec_bases);
1174 unsigned long expires;
1175
1176 spin_lock(&base->lock);
1177 if (time_before_eq(base->next_timer, base->timer_jiffies))
1178 base->next_timer = __next_timer_interrupt(base);
1179 expires = base->next_timer;
1180 spin_unlock(&base->lock);
1181
1182 if (time_before_eq(expires, now))
1183 return now;
1184
1185 return cmp_next_hrtimer_event(now, expires);
1186}
1187#endif
1188
1189
1190
1191
1192
1193void update_process_times(int user_tick)
1194{
1195 struct task_struct *p = current;
1196 int cpu = smp_processor_id();
1197
1198
1199 account_process_tick(p, user_tick);
1200 run_local_timers();
1201 rcu_check_callbacks(cpu, user_tick);
1202 printk_tick();
1203 perf_event_do_pending();
1204 scheduler_tick();
1205 run_posix_cpu_timers(p);
1206}
1207
1208
1209
1210
1211static void run_timer_softirq(struct softirq_action *h)
1212{
1213 struct tvec_base *base = __get_cpu_var(tvec_bases);
1214
1215 hrtimer_run_pending();
1216
1217 if (time_after_eq(jiffies, base->timer_jiffies))
1218 __run_timers(base);
1219}
1220
1221
1222
1223
1224void run_local_timers(void)
1225{
1226 hrtimer_run_queues();
1227 raise_softirq(TIMER_SOFTIRQ);
1228 softlockup_tick();
1229}
1230
1231
1232
1233
1234
1235
1236
1237void do_timer(unsigned long ticks)
1238{
1239 jiffies_64 += ticks;
1240 update_wall_time();
1241 calc_global_load();
1242}
1243
1244#ifdef __ARCH_WANT_SYS_ALARM
1245
1246
1247
1248
1249
1250SYSCALL_DEFINE1(alarm, unsigned int, seconds)
1251{
1252 return alarm_setitimer(seconds);
1253}
1254
1255#endif
1256
1257#ifndef __alpha__
1258
1259
1260
1261
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273SYSCALL_DEFINE0(getpid)
1274{
1275 return task_tgid_vnr(current);
1276}
1277
1278
1279
1280
1281
1282
1283
1284SYSCALL_DEFINE0(getppid)
1285{
1286 int pid;
1287
1288 rcu_read_lock();
1289 pid = task_tgid_vnr(current->real_parent);
1290 rcu_read_unlock();
1291
1292 return pid;
1293}
1294
1295SYSCALL_DEFINE0(getuid)
1296{
1297
1298 return current_uid();
1299}
1300
1301SYSCALL_DEFINE0(geteuid)
1302{
1303
1304 return current_euid();
1305}
1306
1307SYSCALL_DEFINE0(getgid)
1308{
1309
1310 return current_gid();
1311}
1312
1313SYSCALL_DEFINE0(getegid)
1314{
1315
1316 return current_egid();
1317}
1318
1319#endif
1320
1321static void process_timeout(unsigned long __data)
1322{
1323 wake_up_process((struct task_struct *)__data);
1324}
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352signed long __sched schedule_timeout(signed long timeout)
1353{
1354 struct timer_list timer;
1355 unsigned long expire;
1356
1357 switch (timeout)
1358 {
1359 case MAX_SCHEDULE_TIMEOUT:
1360
1361
1362
1363
1364
1365
1366
1367 schedule();
1368 goto out;
1369 default:
1370
1371
1372
1373
1374
1375
1376
1377 if (timeout < 0) {
1378 printk(KERN_ERR "schedule_timeout: wrong timeout "
1379 "value %lx\n", timeout);
1380 dump_stack();
1381 current->state = TASK_RUNNING;
1382 goto out;
1383 }
1384 }
1385
1386 expire = timeout + jiffies;
1387
1388 setup_timer_on_stack(&timer, process_timeout, (unsigned long)current);
1389 __mod_timer(&timer, expire, false, TIMER_NOT_PINNED);
1390 schedule();
1391 del_singleshot_timer_sync(&timer);
1392
1393
1394 destroy_timer_on_stack(&timer);
1395
1396 timeout = expire - jiffies;
1397
1398 out:
1399 return timeout < 0 ? 0 : timeout;
1400}
1401EXPORT_SYMBOL(schedule_timeout);
1402
1403
1404
1405
1406
1407signed long __sched schedule_timeout_interruptible(signed long timeout)
1408{
1409 __set_current_state(TASK_INTERRUPTIBLE);
1410 return schedule_timeout(timeout);
1411}
1412EXPORT_SYMBOL(schedule_timeout_interruptible);
1413
1414signed long __sched schedule_timeout_killable(signed long timeout)
1415{
1416 __set_current_state(TASK_KILLABLE);
1417 return schedule_timeout(timeout);
1418}
1419EXPORT_SYMBOL(schedule_timeout_killable);
1420
1421signed long __sched schedule_timeout_uninterruptible(signed long timeout)
1422{
1423 __set_current_state(TASK_UNINTERRUPTIBLE);
1424 return schedule_timeout(timeout);
1425}
1426EXPORT_SYMBOL(schedule_timeout_uninterruptible);
1427
1428
1429SYSCALL_DEFINE0(gettid)
1430{
1431 return task_pid_vnr(current);
1432}
1433
1434
1435
1436
1437
1438int do_sysinfo(struct sysinfo *info)
1439{
1440 unsigned long mem_total, sav_total;
1441 unsigned int mem_unit, bitcount;
1442 struct timespec tp;
1443
1444 memset(info, 0, sizeof(struct sysinfo));
1445
1446 ktime_get_ts(&tp);
1447 monotonic_to_bootbased(&tp);
1448 info->uptime = tp.tv_sec + (tp.tv_nsec ? 1 : 0);
1449
1450 get_avenrun(info->loads, 0, SI_LOAD_SHIFT - FSHIFT);
1451
1452 info->procs = nr_threads;
1453
1454 si_meminfo(info);
1455 si_swapinfo(info);
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466 mem_total = info->totalram + info->totalswap;
1467 if (mem_total < info->totalram || mem_total < info->totalswap)
1468 goto out;
1469 bitcount = 0;
1470 mem_unit = info->mem_unit;
1471 while (mem_unit > 1) {
1472 bitcount++;
1473 mem_unit >>= 1;
1474 sav_total = mem_total;
1475 mem_total <<= 1;
1476 if (mem_total < sav_total)
1477 goto out;
1478 }
1479
1480
1481
1482
1483
1484
1485
1486
1487 info->mem_unit = 1;
1488 info->totalram <<= bitcount;
1489 info->freeram <<= bitcount;
1490 info->sharedram <<= bitcount;
1491 info->bufferram <<= bitcount;
1492 info->totalswap <<= bitcount;
1493 info->freeswap <<= bitcount;
1494 info->totalhigh <<= bitcount;
1495 info->freehigh <<= bitcount;
1496
1497out:
1498 return 0;
1499}
1500
1501SYSCALL_DEFINE1(sysinfo, struct sysinfo __user *, info)
1502{
1503 struct sysinfo val;
1504
1505 do_sysinfo(&val);
1506
1507 if (copy_to_user(info, &val, sizeof(struct sysinfo)))
1508 return -EFAULT;
1509
1510 return 0;
1511}
1512
1513static int __cpuinit init_timers_cpu(int cpu)
1514{
1515 int j;
1516 struct tvec_base *base;
1517 static char __cpuinitdata tvec_base_done[NR_CPUS];
1518
1519 if (!tvec_base_done[cpu]) {
1520 static char boot_done;
1521
1522 if (boot_done) {
1523
1524
1525
1526 base = kmalloc_node(sizeof(*base),
1527 GFP_KERNEL | __GFP_ZERO,
1528 cpu_to_node(cpu));
1529 if (!base)
1530 return -ENOMEM;
1531
1532
1533 if (tbase_get_deferrable(base)) {
1534 WARN_ON(1);
1535 kfree(base);
1536 return -ENOMEM;
1537 }
1538 per_cpu(tvec_bases, cpu) = base;
1539 } else {
1540
1541
1542
1543
1544
1545
1546 boot_done = 1;
1547 base = &boot_tvec_bases;
1548 }
1549 tvec_base_done[cpu] = 1;
1550 } else {
1551 base = per_cpu(tvec_bases, cpu);
1552 }
1553
1554 spin_lock_init(&base->lock);
1555
1556 for (j = 0; j < TVN_SIZE; j++) {
1557 INIT_LIST_HEAD(base->tv5.vec + j);
1558 INIT_LIST_HEAD(base->tv4.vec + j);
1559 INIT_LIST_HEAD(base->tv3.vec + j);
1560 INIT_LIST_HEAD(base->tv2.vec + j);
1561 }
1562 for (j = 0; j < TVR_SIZE; j++)
1563 INIT_LIST_HEAD(base->tv1.vec + j);
1564
1565 base->timer_jiffies = jiffies;
1566 base->next_timer = base->timer_jiffies;
1567 return 0;
1568}
1569
1570#ifdef CONFIG_HOTPLUG_CPU
1571static void migrate_timer_list(struct tvec_base *new_base, struct list_head *head)
1572{
1573 struct timer_list *timer;
1574
1575 while (!list_empty(head)) {
1576 timer = list_first_entry(head, struct timer_list, entry);
1577 detach_timer(timer, 0);
1578 timer_set_base(timer, new_base);
1579 if (time_before(timer->expires, new_base->next_timer) &&
1580 !tbase_get_deferrable(timer->base))
1581 new_base->next_timer = timer->expires;
1582 internal_add_timer(new_base, timer);
1583 }
1584}
1585
1586static void __cpuinit migrate_timers(int cpu)
1587{
1588 struct tvec_base *old_base;
1589 struct tvec_base *new_base;
1590 int i;
1591
1592 BUG_ON(cpu_online(cpu));
1593 old_base = per_cpu(tvec_bases, cpu);
1594 new_base = get_cpu_var(tvec_bases);
1595
1596
1597
1598
1599 spin_lock_irq(&new_base->lock);
1600 spin_lock_nested(&old_base->lock, SINGLE_DEPTH_NESTING);
1601
1602 BUG_ON(old_base->running_timer);
1603
1604 for (i = 0; i < TVR_SIZE; i++)
1605 migrate_timer_list(new_base, old_base->tv1.vec + i);
1606 for (i = 0; i < TVN_SIZE; i++) {
1607 migrate_timer_list(new_base, old_base->tv2.vec + i);
1608 migrate_timer_list(new_base, old_base->tv3.vec + i);
1609 migrate_timer_list(new_base, old_base->tv4.vec + i);
1610 migrate_timer_list(new_base, old_base->tv5.vec + i);
1611 }
1612
1613 spin_unlock(&old_base->lock);
1614 spin_unlock_irq(&new_base->lock);
1615 put_cpu_var(tvec_bases);
1616}
1617#endif
1618
1619static int __cpuinit timer_cpu_notify(struct notifier_block *self,
1620 unsigned long action, void *hcpu)
1621{
1622 long cpu = (long)hcpu;
1623 switch(action) {
1624 case CPU_UP_PREPARE:
1625 case CPU_UP_PREPARE_FROZEN:
1626 if (init_timers_cpu(cpu) < 0)
1627 return NOTIFY_BAD;
1628 break;
1629#ifdef CONFIG_HOTPLUG_CPU
1630 case CPU_DEAD:
1631 case CPU_DEAD_FROZEN:
1632 migrate_timers(cpu);
1633 break;
1634#endif
1635 default:
1636 break;
1637 }
1638 return NOTIFY_OK;
1639}
1640
1641static struct notifier_block __cpuinitdata timers_nb = {
1642 .notifier_call = timer_cpu_notify,
1643};
1644
1645
1646void __init init_timers(void)
1647{
1648 int err = timer_cpu_notify(&timers_nb, (unsigned long)CPU_UP_PREPARE,
1649 (void *)(long)smp_processor_id());
1650
1651 init_timer_stats();
1652
1653 BUG_ON(err == NOTIFY_BAD);
1654 register_cpu_notifier(&timers_nb);
1655 open_softirq(TIMER_SOFTIRQ, run_timer_softirq);
1656}
1657
1658
1659
1660
1661
1662void msleep(unsigned int msecs)
1663{
1664 unsigned long timeout = msecs_to_jiffies(msecs) + 1;
1665
1666 while (timeout)
1667 timeout = schedule_timeout_uninterruptible(timeout);
1668}
1669
1670EXPORT_SYMBOL(msleep);
1671
1672
1673
1674
1675
1676unsigned long msleep_interruptible(unsigned int msecs)
1677{
1678 unsigned long timeout = msecs_to_jiffies(msecs) + 1;
1679
1680 while (timeout && !signal_pending(current))
1681 timeout = schedule_timeout_interruptible(timeout);
1682 return jiffies_to_msecs(timeout);
1683}
1684
1685EXPORT_SYMBOL(msleep_interruptible);
1686