2
0

cgroup.go 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383
  1. package worker
  2. import (
  3. "errors"
  4. "fmt"
  5. "io"
  6. "os"
  7. "os/exec"
  8. "path/filepath"
  9. "syscall"
  10. "time"
  11. "golang.org/x/sys/unix"
  12. cgroups "github.com/containerd/cgroups/v3"
  13. cgv1 "github.com/containerd/cgroups/v3/cgroup1"
  14. cgv2 "github.com/containerd/cgroups/v3/cgroup2"
  15. "github.com/moby/moby/pkg/reexec"
  16. contspecs "github.com/opencontainers/runtime-spec/specs-go"
  17. )
  18. type cgroupHook struct {
  19. emptyHook
  20. cgCfg cgroupConfig
  21. memLimit MemBytes
  22. cgMgrV1 cgv1.Cgroup
  23. cgMgrV2 *cgv2.Manager
  24. }
  25. type execCmd string
  26. const (
  27. cmdCont execCmd = "cont"
  28. cmdAbrt execCmd = "abrt"
  29. )
  30. func init() {
  31. reexec.Register("tunasync-exec", waitExec)
  32. }
  33. func waitExec() {
  34. binary, err := exec.LookPath(os.Args[1])
  35. if err != nil {
  36. panic(err)
  37. }
  38. pipe := os.NewFile(3, "pipe")
  39. if pipe != nil {
  40. if _, err := pipe.Stat(); err == nil {
  41. cmdBytes, err := io.ReadAll(pipe)
  42. if err != nil {
  43. panic(err)
  44. }
  45. if err := pipe.Close(); err != nil {
  46. }
  47. cmd := execCmd(string(cmdBytes))
  48. switch cmd {
  49. case cmdAbrt:
  50. fallthrough
  51. default:
  52. panic("Exited on request")
  53. case cmdCont:
  54. }
  55. }
  56. }
  57. args := os.Args[1:]
  58. env := os.Environ()
  59. if err := syscall.Exec(binary, args, env); err != nil {
  60. panic(err)
  61. }
  62. panic("Exec failed.")
  63. }
  64. func initCgroup(cfg *cgroupConfig) error {
  65. logger.Debugf("Initializing cgroup")
  66. baseGroup := cfg.Group
  67. //subsystem := cfg.Subsystem
  68. // If baseGroup is empty, it implies using the cgroup of the current process
  69. // otherwise, it refers to a absolute group path
  70. if baseGroup != "" {
  71. baseGroup = filepath.Join("/", baseGroup)
  72. }
  73. cfg.isUnified = cgroups.Mode() == cgroups.Unified
  74. if cfg.isUnified {
  75. logger.Debugf("Cgroup V2 detected")
  76. g := baseGroup
  77. if g == "" {
  78. logger.Debugf("Detecting my cgroup path")
  79. var err error
  80. if g, err = cgv2.NestedGroupPath(""); err != nil {
  81. return err
  82. }
  83. }
  84. logger.Infof("Using cgroup path: %s", g)
  85. var err error
  86. if cfg.cgMgrV2, err = cgv2.Load(g); err != nil {
  87. return err
  88. }
  89. if baseGroup == "" {
  90. logger.Debugf("Creating a sub group and move all processes into it")
  91. wkrMgr, err := cfg.cgMgrV2.NewChild("__worker", nil)
  92. if err != nil {
  93. return err
  94. }
  95. for {
  96. logger.Debugf("Reading pids")
  97. procs, err := cfg.cgMgrV2.Procs(false)
  98. if err != nil {
  99. logger.Errorf("Cannot read pids in that group")
  100. return err
  101. }
  102. if len(procs) == 0 {
  103. break
  104. }
  105. for _, p := range procs {
  106. if err := wkrMgr.AddProc(p); err != nil {
  107. if errors.Is(err, syscall.ESRCH) {
  108. logger.Debugf("Write pid %d to sub group failed: process vanished, ignoring")
  109. } else {
  110. return err
  111. }
  112. }
  113. }
  114. }
  115. } else {
  116. logger.Debugf("Trying to create a sub group in that group")
  117. testMgr, err := cfg.cgMgrV2.NewChild("__test", nil)
  118. if err != nil {
  119. logger.Errorf("Cannot create a sub group in the cgroup")
  120. return err
  121. }
  122. if err := testMgr.Delete(); err != nil {
  123. return err
  124. }
  125. procs, err := cfg.cgMgrV2.Procs(false)
  126. if err != nil {
  127. logger.Errorf("Cannot read pids in that group")
  128. return err
  129. }
  130. if len(procs) != 0 {
  131. return fmt.Errorf("There are remaining processes in cgroup %s", baseGroup)
  132. }
  133. }
  134. } else {
  135. logger.Debugf("Cgroup V1 detected")
  136. var pather cgv1.Path
  137. if baseGroup != "" {
  138. pather = cgv1.StaticPath(baseGroup)
  139. } else {
  140. pather = (func(p cgv1.Path) cgv1.Path {
  141. return func(subsys cgv1.Name) (string, error) {
  142. path, err := p(subsys)
  143. if err != nil {
  144. return "", err
  145. }
  146. if path == "/" {
  147. return "", cgv1.ErrControllerNotActive
  148. }
  149. return path, err
  150. }
  151. })(cgv1.NestedPath(""))
  152. }
  153. logger.Infof("Loading cgroup")
  154. var err error
  155. if cfg.cgMgrV1, err = cgv1.Load(pather, func(cfg *cgv1.InitConfig) error {
  156. cfg.InitCheck = cgv1.AllowAny
  157. return nil
  158. }); err != nil {
  159. return err
  160. }
  161. logger.Debugf("Available subsystems:")
  162. for _, subsys := range cfg.cgMgrV1.Subsystems() {
  163. p, err := pather(subsys.Name())
  164. if err != nil {
  165. return err
  166. }
  167. logger.Debugf("%s: %s", subsys.Name(), p)
  168. }
  169. if baseGroup == "" {
  170. logger.Debugf("Creating a sub group and move all processes into it")
  171. wkrMgr, err := cfg.cgMgrV1.New("__worker", &contspecs.LinuxResources{})
  172. if err != nil {
  173. return err
  174. }
  175. for _, subsys := range cfg.cgMgrV1.Subsystems() {
  176. logger.Debugf("Reading pids for subsystem %s", subsys.Name())
  177. for {
  178. procs, err := cfg.cgMgrV1.Processes(subsys.Name(), false)
  179. if err != nil {
  180. p, err := pather(subsys.Name())
  181. if err != nil {
  182. return err
  183. }
  184. logger.Errorf("Cannot read pids in group %s of subsystem %s", p, subsys.Name())
  185. return err
  186. }
  187. if len(procs) == 0 {
  188. break
  189. }
  190. for _, proc := range procs {
  191. if err := wkrMgr.Add(proc); err != nil {
  192. if errors.Is(err, syscall.ESRCH) {
  193. logger.Debugf("Write pid %d to sub group failed: process vanished, ignoring")
  194. } else {
  195. return err
  196. }
  197. }
  198. }
  199. }
  200. }
  201. } else {
  202. logger.Debugf("Trying to create a sub group in that group")
  203. testMgr, err := cfg.cgMgrV1.New("__test", &contspecs.LinuxResources{})
  204. if err != nil {
  205. logger.Errorf("Cannot create a sub group in the cgroup")
  206. return err
  207. }
  208. if err := testMgr.Delete(); err != nil {
  209. return err
  210. }
  211. for _, subsys := range cfg.cgMgrV1.Subsystems() {
  212. logger.Debugf("Reading pids for subsystem %s", subsys.Name())
  213. procs, err := cfg.cgMgrV1.Processes(subsys.Name(), false)
  214. if err != nil {
  215. p, err := pather(subsys.Name())
  216. if err != nil {
  217. return err
  218. }
  219. logger.Errorf("Cannot read pids in group %s of subsystem %s", p, subsys.Name())
  220. return err
  221. }
  222. if len(procs) != 0 {
  223. p, err := pather(subsys.Name())
  224. if err != nil {
  225. return err
  226. }
  227. return fmt.Errorf("There are remaining processes in cgroup %s of subsystem %s", p, subsys.Name())
  228. }
  229. }
  230. }
  231. }
  232. return nil
  233. }
  234. func newCgroupHook(p mirrorProvider, cfg cgroupConfig, memLimit MemBytes) *cgroupHook {
  235. return &cgroupHook{
  236. emptyHook: emptyHook{
  237. provider: p,
  238. },
  239. cgCfg: cfg,
  240. memLimit: memLimit,
  241. }
  242. }
  243. func (c *cgroupHook) preExec() error {
  244. if c.cgCfg.isUnified {
  245. logger.Debugf("Creating v2 cgroup for task %s", c.provider.Name())
  246. var resSet *cgv2.Resources
  247. if c.memLimit != 0 {
  248. resSet = &cgv2.Resources{
  249. Memory: &cgv2.Memory{
  250. Max: func(i int64) *int64 { return &i }(c.memLimit.Value()),
  251. },
  252. }
  253. }
  254. subMgr, err := c.cgCfg.cgMgrV2.NewChild(c.provider.Name(), resSet)
  255. if err != nil {
  256. logger.Errorf("Failed to create cgroup for task %s: %s", c.provider.Name(), err.Error())
  257. return err
  258. }
  259. c.cgMgrV2 = subMgr
  260. } else {
  261. logger.Debugf("Creating v1 cgroup for task %s", c.provider.Name())
  262. var resSet contspecs.LinuxResources
  263. if c.memLimit != 0 {
  264. resSet = contspecs.LinuxResources{
  265. Memory: &contspecs.LinuxMemory{
  266. Limit: func(i int64) *int64 { return &i }(c.memLimit.Value()),
  267. },
  268. }
  269. }
  270. subMgr, err := c.cgCfg.cgMgrV1.New(c.provider.Name(), &resSet)
  271. if err != nil {
  272. logger.Errorf("Failed to create cgroup for task %s: %s", c.provider.Name(), err.Error())
  273. return err
  274. }
  275. c.cgMgrV1 = subMgr
  276. }
  277. return nil
  278. }
  279. func (c *cgroupHook) postExec() error {
  280. err := c.killAll()
  281. if err != nil {
  282. logger.Errorf("Error killing tasks: %s", err.Error())
  283. }
  284. if c.cgCfg.isUnified {
  285. logger.Debugf("Deleting v2 cgroup for task %s", c.provider.Name())
  286. if err := c.cgMgrV2.Delete(); err != nil {
  287. logger.Errorf("Failed to delete cgroup for task %s: %s", c.provider.Name(), err.Error())
  288. return err
  289. }
  290. c.cgMgrV2 = nil
  291. } else {
  292. logger.Debugf("Deleting v1 cgroup for task %s", c.provider.Name())
  293. if err := c.cgMgrV1.Delete(); err != nil {
  294. logger.Errorf("Failed to delete cgroup for task %s: %s", c.provider.Name(), err.Error())
  295. return err
  296. }
  297. c.cgMgrV1 = nil
  298. }
  299. return nil
  300. }
  301. func (c *cgroupHook) killAll() error {
  302. if c.cgCfg.isUnified {
  303. if c.cgMgrV2 == nil {
  304. return nil
  305. }
  306. } else {
  307. if c.cgMgrV1 == nil {
  308. return nil
  309. }
  310. }
  311. readTaskList := func() ([]int, error) {
  312. taskList := []int{}
  313. if c.cgCfg.isUnified {
  314. procs, err := c.cgMgrV2.Procs(false)
  315. if err != nil {
  316. return []int{}, err
  317. }
  318. for _, proc := range procs {
  319. taskList = append(taskList, int(proc))
  320. }
  321. } else {
  322. taskSet := make(map[int]struct{})
  323. for _, subsys := range c.cgMgrV1.Subsystems() {
  324. procs, err := c.cgMgrV1.Processes(subsys.Name(), false)
  325. if err != nil {
  326. return []int{}, err
  327. }
  328. for _, proc := range procs {
  329. taskSet[proc.Pid] = struct{}{}
  330. }
  331. }
  332. for proc := range taskSet {
  333. taskList = append(taskList, proc)
  334. }
  335. }
  336. return taskList, nil
  337. }
  338. for i := 0; i < 4; i++ {
  339. if i == 3 {
  340. return errors.New("Unable to kill all child tasks")
  341. }
  342. taskList, err := readTaskList()
  343. if err != nil {
  344. return err
  345. }
  346. if len(taskList) == 0 {
  347. return nil
  348. }
  349. for _, pid := range taskList {
  350. // TODO: deal with defunct processes
  351. logger.Debugf("Killing process: %d", pid)
  352. unix.Kill(pid, syscall.SIGKILL)
  353. }
  354. // sleep 10ms for the first round, and 1.01s, 2.01s, 3.01s for the rest
  355. time.Sleep(time.Duration(i)*time.Second + 10*time.Millisecond)
  356. }
  357. return nil
  358. }