perf: Add perf_event::child_count

The only cross-CPU updates to event->count come from child counters
adding their values back into the parent counter.

So if we move those updates into a new child_count field, we get an
event->count that is only modified locally.
......@@ -671,6 +671,7 @@ struct perf_event {
enum perf_event_active_state state;
unsigned int attach_state;
atomic64_t count;
atomic64_t child_count;
* These are the total time in nanoseconds that the event
......@@ -1738,7 +1738,7 @@ static void __perf_event_read(void *info)
static inline u64 perf_event_count(struct perf_event *event)
return atomic64_read(&event->count);
return atomic64_read(&event->count) + atomic64_read(&event->child_count);
static u64 perf_event_read(struct perf_event *event)
......@@ -5379,7 +5379,7 @@ static void sync_child_event(struct perf_event *child_event,
* Add back the child's count to the parent's count:
atomic64_add(child_val, &parent_event->count);
atomic64_add(child_val, &parent_event->child_count);
