diff options
| author | Mark Brown <broonie@kernel.org> | 2016-02-09 21:20:39 +0300 | 
|---|---|---|
| committer | Mark Brown <broonie@kernel.org> | 2016-02-09 21:20:39 +0300 | 
| commit | fcdcc79628a1919bde9acf239e364f65bab6327c (patch) | |
| tree | 5499be387cf3028c90ac083b1cf866ebed7bf7e0 /include/linux/cgroup-defs.h | |
| parent | 7a8d44bc89e5cddcd5c0704a11a90484d36ba6ba (diff) | |
| parent | a0a90718f18264dc904d34a580f332006f5561e9 (diff) | |
| download | linux-fcdcc79628a1919bde9acf239e364f65bab6327c.tar.xz | |
Merge branch 'topic/acpi' of git://git.kernel.org/pub/scm/linux/kernel/git/broonie/spi into spi-pxa2xx
Diffstat (limited to 'include/linux/cgroup-defs.h')
| -rw-r--r-- | include/linux/cgroup-defs.h | 152 | 
1 files changed, 132 insertions, 20 deletions
| diff --git a/include/linux/cgroup-defs.h b/include/linux/cgroup-defs.h index 60d44b26276d..7f540f7f588d 100644 --- a/include/linux/cgroup-defs.h +++ b/include/linux/cgroup-defs.h @@ -34,17 +34,12 @@ struct seq_file;  /* define the enumeration of all cgroup subsystems */  #define SUBSYS(_x) _x ## _cgrp_id, -#define SUBSYS_TAG(_t) CGROUP_ ## _t, \ -	__unused_tag_ ## _t = CGROUP_ ## _t - 1,  enum cgroup_subsys_id {  #include <linux/cgroup_subsys.h>  	CGROUP_SUBSYS_COUNT,  }; -#undef SUBSYS_TAG  #undef SUBSYS -#define CGROUP_CANFORK_COUNT (CGROUP_CANFORK_END - CGROUP_CANFORK_START) -  /* bits in struct cgroup_subsys_state flags field */  enum {  	CSS_NO_REF	= (1 << 0), /* no reference counting for this css */ @@ -66,7 +61,6 @@ enum {  /* cgroup_root->flags */  enum { -	CGRP_ROOT_SANE_BEHAVIOR	= (1 << 0), /* __DEVEL__sane_behavior specified */  	CGRP_ROOT_NOPREFIX	= (1 << 1), /* mounted subsystems have no named prefix */  	CGRP_ROOT_XATTR		= (1 << 2), /* supports extended attributes */  }; @@ -90,7 +84,6 @@ enum {   */  struct cgroup_file {  	/* do not access any fields from outside cgroup core */ -	struct list_head node;			/* anchored at css->files */  	struct kernfs_node *kn;  }; @@ -134,9 +127,6 @@ struct cgroup_subsys_state {  	 */  	u64 serial_nr; -	/* all cgroup_files associated with this css */ -	struct list_head files; -  	/* percpu_ref killing and RCU release */  	struct rcu_head rcu_head;  	struct work_struct destroy_work; @@ -235,6 +225,14 @@ struct cgroup {  	int id;  	/* +	 * The depth this cgroup is at.  The root is at depth zero and each +	 * step down the hierarchy increments the level.  This along with +	 * ancestor_ids[] can determine whether a given cgroup is a +	 * descendant of another without traversing the hierarchy. +	 */ +	int level; + +	/*  	 * Each non-empty css_set associated with this cgroup contributes  	 * one to populated_cnt.  All children with non-zero popuplated_cnt  	 * of their own contribute one.  The count is zero iff there's no @@ -289,6 +287,9 @@ struct cgroup {  	/* used to schedule release agent */  	struct work_struct release_agent_work; + +	/* ids of the ancestors at each level including self */ +	int ancestor_ids[];  };  /* @@ -308,6 +309,9 @@ struct cgroup_root {  	/* The root cgroup.  Root is destroyed on its release. */  	struct cgroup cgrp; +	/* for cgrp->ancestor_ids[0] */ +	int cgrp_ancestor_id_storage; +  	/* Number of cgroups in the hierarchy, used only for /proc/cgroups */  	atomic_t nr_cgrps; @@ -426,15 +430,12 @@ struct cgroup_subsys {  	void (*css_reset)(struct cgroup_subsys_state *css);  	void (*css_e_css_changed)(struct cgroup_subsys_state *css); -	int (*can_attach)(struct cgroup_subsys_state *css, -			  struct cgroup_taskset *tset); -	void (*cancel_attach)(struct cgroup_subsys_state *css, -			      struct cgroup_taskset *tset); -	void (*attach)(struct cgroup_subsys_state *css, -		       struct cgroup_taskset *tset); -	int (*can_fork)(struct task_struct *task, void **priv_p); -	void (*cancel_fork)(struct task_struct *task, void *priv); -	void (*fork)(struct task_struct *task, void *priv); +	int (*can_attach)(struct cgroup_taskset *tset); +	void (*cancel_attach)(struct cgroup_taskset *tset); +	void (*attach)(struct cgroup_taskset *tset); +	int (*can_fork)(struct task_struct *task); +	void (*cancel_fork)(struct task_struct *task); +	void (*fork)(struct task_struct *task);  	void (*exit)(struct task_struct *task);  	void (*free)(struct task_struct *task);  	void (*bind)(struct cgroup_subsys_state *root_css); @@ -520,7 +521,6 @@ static inline void cgroup_threadgroup_change_end(struct task_struct *tsk)  #else	/* CONFIG_CGROUPS */ -#define CGROUP_CANFORK_COUNT 0  #define CGROUP_SUBSYS_COUNT 0  static inline void cgroup_threadgroup_change_begin(struct task_struct *tsk) {} @@ -528,4 +528,116 @@ static inline void cgroup_threadgroup_change_end(struct task_struct *tsk) {}  #endif	/* CONFIG_CGROUPS */ +#ifdef CONFIG_SOCK_CGROUP_DATA + +/* + * sock_cgroup_data is embedded at sock->sk_cgrp_data and contains + * per-socket cgroup information except for memcg association. + * + * On legacy hierarchies, net_prio and net_cls controllers directly set + * attributes on each sock which can then be tested by the network layer. + * On the default hierarchy, each sock is associated with the cgroup it was + * created in and the networking layer can match the cgroup directly. + * + * To avoid carrying all three cgroup related fields separately in sock, + * sock_cgroup_data overloads (prioidx, classid) and the cgroup pointer. + * On boot, sock_cgroup_data records the cgroup that the sock was created + * in so that cgroup2 matches can be made; however, once either net_prio or + * net_cls starts being used, the area is overriden to carry prioidx and/or + * classid.  The two modes are distinguished by whether the lowest bit is + * set.  Clear bit indicates cgroup pointer while set bit prioidx and + * classid. + * + * While userland may start using net_prio or net_cls at any time, once + * either is used, cgroup2 matching no longer works.  There is no reason to + * mix the two and this is in line with how legacy and v2 compatibility is + * handled.  On mode switch, cgroup references which are already being + * pointed to by socks may be leaked.  While this can be remedied by adding + * synchronization around sock_cgroup_data, given that the number of leaked + * cgroups is bound and highly unlikely to be high, this seems to be the + * better trade-off. + */ +struct sock_cgroup_data { +	union { +#ifdef __LITTLE_ENDIAN +		struct { +			u8	is_data; +			u8	padding; +			u16	prioidx; +			u32	classid; +		} __packed; +#else +		struct { +			u32	classid; +			u16	prioidx; +			u8	padding; +			u8	is_data; +		} __packed; +#endif +		u64		val; +	}; +}; + +/* + * There's a theoretical window where the following accessors race with + * updaters and return part of the previous pointer as the prioidx or + * classid.  Such races are short-lived and the result isn't critical. + */ +static inline u16 sock_cgroup_prioidx(struct sock_cgroup_data *skcd) +{ +	/* fallback to 1 which is always the ID of the root cgroup */ +	return (skcd->is_data & 1) ? skcd->prioidx : 1; +} + +static inline u32 sock_cgroup_classid(struct sock_cgroup_data *skcd) +{ +	/* fallback to 0 which is the unconfigured default classid */ +	return (skcd->is_data & 1) ? skcd->classid : 0; +} + +/* + * If invoked concurrently, the updaters may clobber each other.  The + * caller is responsible for synchronization. + */ +static inline void sock_cgroup_set_prioidx(struct sock_cgroup_data *skcd, +					   u16 prioidx) +{ +	struct sock_cgroup_data skcd_buf = {{ .val = READ_ONCE(skcd->val) }}; + +	if (sock_cgroup_prioidx(&skcd_buf) == prioidx) +		return; + +	if (!(skcd_buf.is_data & 1)) { +		skcd_buf.val = 0; +		skcd_buf.is_data = 1; +	} + +	skcd_buf.prioidx = prioidx; +	WRITE_ONCE(skcd->val, skcd_buf.val);	/* see sock_cgroup_ptr() */ +} + +static inline void sock_cgroup_set_classid(struct sock_cgroup_data *skcd, +					   u32 classid) +{ +	struct sock_cgroup_data skcd_buf = {{ .val = READ_ONCE(skcd->val) }}; + +	if (sock_cgroup_classid(&skcd_buf) == classid) +		return; + +	if (!(skcd_buf.is_data & 1)) { +		skcd_buf.val = 0; +		skcd_buf.is_data = 1; +	} + +	skcd_buf.classid = classid; +	WRITE_ONCE(skcd->val, skcd_buf.val);	/* see sock_cgroup_ptr() */ +} + +#else	/* CONFIG_SOCK_CGROUP_DATA */ + +struct sock_cgroup_data { +}; + +#endif	/* CONFIG_SOCK_CGROUP_DATA */ +  #endif	/* _LINUX_CGROUP_DEFS_H */ | 
