Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
S
slapos.core
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Léo-Paul Géneau
slapos.core
Commits
8bb366ab
Commit
8bb366ab
authored
Jun 28, 2017
by
Tomáš Peterka
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
[manager.cpuset] Split CPU cores half-half between shared and exclusive
parent
d041e861
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
102 additions
and
55 deletions
+102
-55
slapos/manager/cpuset.py
slapos/manager/cpuset.py
+72
-43
slapos/tests/slapformat.py
slapos/tests/slapformat.py
+30
-12
No files found.
slapos/manager/cpuset.py
View file @
8bb366ab
# coding: utf-8
# coding: utf-8
import
logging
import
logging
import
math
import
os
import
os
import
os.path
import
os.path
import
pwd
import
pwd
...
@@ -45,20 +46,39 @@ class Manager(object):
...
@@ -45,20 +46,39 @@ class Manager(object):
logger
.
warning
(
"CPUSet Manager cannot format computer because cgroups do not exist."
)
logger
.
warning
(
"CPUSet Manager cannot format computer because cgroups do not exist."
)
return
return
for
cpu
in
self
.
_cpu_id_list
():
def
create_cpuset_subtree
(
name
,
cpu_id_list
):
"""Create root for cpuset with per-CPU folders."""
if
not
cpu_id_list
:
logger
.
warning
(
"Too less cores - cannot reserve any for
\
"
{}
\
"
"
.
format
(
name
))
return
root_path
=
self
.
_prepare_folder
(
os
.
path
.
join
(
self
.
cpuset_path
,
name
))
with
open
(
root_path
+
"/cpuset.cpus"
,
"wt"
)
as
fx
:
# this cgroup manages all `name` cpus
if
len
(
cpu_id_list
)
==
1
:
fx
.
write
(
str
(
cpu_id_list
[
0
]))
else
:
fx
.
write
(
"{:d}-{:d}"
.
format
(
cpu_id_list
[
0
],
cpu_id_list
[
-
1
]))
create_cpuset_subtree
(
"shared"
,
self
.
_shared_cpu_id_list
())
create_cpuset_subtree
(
"exclusive"
,
self
.
_exclusive_cpu_id_list
())
# separate CPUs in exclusive set
exclusive_cpu_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
)
write_file
(
"1"
,
exclusive_cpu_path
+
"/cpuset.cpu_exclusive"
)
# exclusive
write_file
(
"0"
,
exclusive_cpu_path
+
"/cpuset.mems"
)
# it doesn't work without that
for
cpu
in
self
.
_exclusive_cpu_id_list
():
cpu_path
=
self
.
_prepare_folder
(
cpu_path
=
self
.
_prepare_folder
(
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu"
+
str
(
cpu
)))
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
,
"cpu"
+
str
(
cpu
)))
with
open
(
cpu_path
+
"/cpuset.cpus"
,
"wt"
)
as
fx
:
write_file
(
str
(
cpu
),
cpu_path
+
"/cpuset.cpus"
)
# manage only this cpu
fx
.
write
(
str
(
cpu
))
# this cgroup manages only this cpu
write_file
(
"1"
,
cpu_path
+
"/cpuset.cpu_exclusive"
)
# exclusive
with
open
(
cpu_path
+
"/cpuset.cpu_exclusive"
,
"wt"
)
as
fx
:
write_file
(
"0"
,
cpu_path
+
"/cpuset.mems"
)
# it doesn't work without that
fx
.
write
(
"1"
)
# manages it exclusively
with
open
(
cpu_path
+
"/cpuset.mems"
,
"wt"
)
as
fx
:
fx
.
write
(
"0"
)
# it doesn't work without that
def
instance
(
self
,
partition
):
def
instance
(
self
,
partition
):
"""Control runtime state of the computer."""
"""Control runtime state of the computer."""
if
not
os
.
path
.
exists
(
os
.
path
.
join
(
self
.
cpuset_path
,
"
cpu0
"
)):
if
not
os
.
path
.
exists
(
os
.
path
.
join
(
self
.
cpuset_path
,
"
shared
"
)):
# check whether the computer was formatted
# check whether the computer was formatted
logger
.
warning
(
"CGROUP's CPUSET Manager cannot update computer because it is not cpuset-formatted."
)
logger
.
warning
(
"CGROUP's CPUSET Manager cannot update computer because it is not cpuset-formatted."
)
return
return
...
@@ -73,15 +93,13 @@ class Manager(object):
...
@@ -73,15 +93,13 @@ class Manager(object):
uid
,
gid
=
partition
.
getUserGroupId
()
uid
,
gid
=
partition
.
getUserGroupId
()
uname
=
pwd
.
getpwuid
(
uid
).
pw_name
uname
=
pwd
.
getpwuid
(
uid
).
pw_name
if
uname
not
in
power_user_list
:
if
uname
not
in
power_user_list
:
logger
.
warning
(
"
User {}
not allowed to modify cpuset! "
logger
.
warning
(
"
{} is
not allowed to modify cpuset! "
"Allowed users are in {} option in config file."
.
format
(
"Allowed users are in {} option in config file."
.
format
(
uname
,
self
.
config_power_user_option
))
uname
,
self
.
config_power_user_option
))
return
return
# prepare paths to tasks file for all and per-cpu
# prepare paths to tasks file for all and per-cpu
tasks_file
=
os
.
path
.
join
(
self
.
cpuset_path
,
"tasks"
)
tasks_file
=
os
.
path
.
join
(
self
.
cpuset_path
,
"tasks"
)
cpu_tasks_file_list
=
[
os
.
path
.
join
(
cpu_folder
,
"tasks"
)
for
cpu_folder
in
self
.
_cpu_folder_list
()]
# Gather exclusive CPU usage map {username: set[cpu_id]}
# Gather exclusive CPU usage map {username: set[cpu_id]}
# We do not need to gather that since we have no limits yet
# We do not need to gather that since we have no limits yet
...
@@ -93,13 +111,14 @@ class Manager(object):
...
@@ -93,13 +111,14 @@ class Manager(object):
# process = psutil.Process(pid)
# process = psutil.Process(pid)
# cpu_usage[process.username()].add(cpu_id)
# cpu_usage[process.username()].add(cpu_id)
# Move all PIDs from the pool of all CPUs onto
the first exclusive CPU
.
# Move all PIDs from the pool of all CPUs onto
shared CPUs
.
running_list
=
sorted
(
list
(
map
(
int
,
read_file
(
tasks_file
).
split
())),
reverse
=
True
)
running_list
=
sorted
(
list
(
map
(
int
,
read_file
(
tasks_file
).
split
())),
reverse
=
True
)
first_cpu
=
self
.
_cpu_id_list
()[
0
]
shared_tasks_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"shared"
,
"tasks"
)
exclusive_tasks_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
,
"tasks"
)
success_set
,
refused_set
=
set
(),
set
()
success_set
,
refused_set
=
set
(),
set
()
for
pid
in
running_list
:
for
pid
in
running_list
:
try
:
try
:
self
.
_move_task
(
pid
,
first_cpu
)
write_file
(
"{:d}
\
n
"
.
format
(
pid
),
shared_tasks_path
,
mode
=
self
.
task_write_mode
)
success_set
.
add
(
pid
)
success_set
.
add
(
pid
)
time
.
sleep
(
0.01
)
time
.
sleep
(
0.01
)
except
IOError
as
e
:
except
IOError
as
e
:
...
@@ -108,37 +127,40 @@ class Manager(object):
...
@@ -108,37 +127,40 @@ class Manager(object):
"Suceeded in moving {:d} PIDs {!s}
\
n
"
.
format
(
"Suceeded in moving {:d} PIDs {!s}
\
n
"
.
format
(
len
(
refused_set
),
refused_set
,
len
(
success_set
),
success_set
))
len
(
refused_set
),
refused_set
,
len
(
success_set
),
success_set
))
cpu_folder_list
=
self
.
_cpu_folder_list
()
generic_cpu_path
=
cpu_folder_list
[
0
]
exclusive_cpu_path_list
=
cpu_folder_list
[
1
:]
# Gather all running PIDs for filtering out stale PIDs
# Gather all running PIDs for filtering out stale PIDs
running_pid_set
=
set
(
running_list
)
running_pid_set
=
set
(
running_list
)
running_pid_set
.
update
(
map
(
int
,
read_file
(
cpu_tasks_file_list
[
0
]
).
split
()))
running_pid_set
.
update
(
map
(
int
,
read_file
(
shared_tasks_path
).
split
()))
#
g
ather already exclusively running PIDs
#
G
ather already exclusively running PIDs
exclusive_pid_set
=
set
()
exclusive_pid_set
=
set
()
for
cpu_tasks_file
in
cpu_tasks_file_list
[
1
:]
:
for
cpu_tasks_file
in
[
exclusive_tasks_path
,
]
+
self
.
_exclusive_cpu_tasks_list
()
:
exclusive_pid_set
.
update
(
map
(
int
,
read_file
(
cpu_tasks_file
).
split
()))
exclusive_pid_set
.
update
(
map
(
int
,
read_file
(
cpu_tasks_file
).
split
()))
# Move processes to their demanded exclusive CPUs
# move processes to their demanded exclusive CPUs
with
open
(
request_file
,
"rt"
)
as
fi
:
request_pid_list
=
map
(
int
,
read_file
(
request_file
).
split
())
# empty the request file (we will write back only PIDs which weren't moved)
write_file
(
""
,
request_file
)
# take such PIDs which are either really running or are not already exclusive
# take such PIDs which are either really running or are not already exclusive
request_pid_list
=
[
int
(
pid
)
for
pid
in
fi
.
read
().
split
()
for
request_pid
in
filter
(
lambda
pid
:
pid
in
running_pid_set
and
pid
not
in
exclusive_pid_set
,
request_pid_list
):
if
int
(
pid
)
in
running_pid_set
or
int
(
pid
)
not
in
exclusive_pid_set
]
with
open
(
request_file
,
"wt"
)
as
fo
:
fo
.
write
(
""
)
# empty file (we will write back only PIDs which weren't moved)
for
request_pid
in
request_pid_list
:
assigned_cpu
=
self
.
_move_to_exclusive_cpu
(
request_pid
)
assigned_cpu
=
self
.
_move_to_exclusive_cpu
(
request_pid
)
if
assigned_cpu
<
0
:
if
assigned_cpu
<
0
:
# if no exclusive CPU was assigned - write the PID back and try other time
# if no exclusive CPU was assigned - write the PID back and try other time
with
open
(
request_file
,
"at"
)
as
fo
:
write_file
(
"{:d}
\
n
"
.
format
(
request_pid
),
request_file
,
mode
=
"at"
)
fo
.
write
(
str
(
request_pid
)
+
"
\
n
"
)
def
_
cpu_folder
_list
(
self
):
def
_
exclusive_cpu_tasks
_list
(
self
):
"""Return list of folders for exclusive cpu cores."""
"""Return list of folders for exclusive cpu cores."""
return
[
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu"
+
str
(
cpu_id
))
return
[
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
,
"cpu"
+
str
(
cpu_id
),
"tasks"
)
for
cpu_id
in
self
.
_cpu_id_list
()]
for
cpu_id
in
self
.
_exclusive_cpu_id_list
()]
def
_shared_cpu_id_list
(
self
):
"""Return list of shared CPU core IDs."""
cpu_id_list
=
self
.
_cpu_id_list
()
return
cpu_id_list
[:
int
(
math
.
ceil
(
len
(
cpu_id_list
)
/
2
))]
def
_exclusive_cpu_id_list
(
self
):
"""Return list of exclusive CPU core IDs."""
cpu_id_list
=
self
.
_cpu_id_list
()
return
cpu_id_list
[
int
(
math
.
ceil
(
len
(
cpu_id_list
)
/
2
)):]
def
_cpu_id_list
(
self
):
def
_cpu_id_list
(
self
):
"""Extract IDs of available CPUs and return them as a list.
"""Extract IDs of available CPUs and return them as a list.
...
@@ -162,12 +184,12 @@ class Manager(object):
...
@@ -162,12 +184,12 @@ class Manager(object):
:return: int, cpu_id of used CPU, -1 if placement was not possible
:return: int, cpu_id of used CPU, -1 if placement was not possible
"""
"""
exclusive_cpu_list
=
self
.
_
cpu_id_list
()[
1
:]
exclusive_cpu_list
=
self
.
_
exclusive_cpu_id_list
()
for
exclusive_cpu
in
exclusive_cpu_list
:
for
exclusive_cpu
in
exclusive_cpu_list
:
# gather tasks assigned to current exclusive CPU
# gather tasks assigned to current exclusive CPU
task_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu"
+
str
(
exclusive_cpu
),
"tasks"
)
task_path
=
os
.
path
.
join
(
with
open
(
task_path
,
"rt"
)
as
fi
:
self
.
cpuset_path
,
"exclusive"
,
"cpu"
+
str
(
exclusive_cpu
),
"tasks"
)
task_list
=
fi
.
read
(
).
split
()
task_list
=
read_file
(
task_path
).
split
()
if
len
(
task_list
)
>
0
:
if
len
(
task_list
)
>
0
:
continue
# skip occupied CPUs
continue
# skip occupied CPUs
return
self
.
_move_task
(
pid
,
exclusive_cpu
)[
1
]
return
self
.
_move_task
(
pid
,
exclusive_cpu
)[
1
]
...
@@ -179,8 +201,11 @@ class Manager(object):
...
@@ -179,8 +201,11 @@ class Manager(object):
cpu_mode can be "performance" or "powersave"
cpu_mode can be "performance" or "powersave"
"""
"""
known_cpu_mode_list
=
(
"performance"
,
"powersave"
)
known_cpu_mode_list
=
(
"performance"
,
"powersave"
)
with
open
(
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu"
+
str
(
cpu_id
),
"tasks"
),
self
.
task_write_mode
)
as
fo
:
if
cpu_id
not
in
self
.
_exclusive_cpu_id_list
():
fo
.
write
(
str
(
pid
)
+
"
\
n
"
)
raise
ValueError
(
"Cannot assign to cpu{:d} because it is shared"
.
format
(
cpu_id
))
# write the PID into concrete tasks file
cpu_tasks
=
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
,
"cpu"
+
str
(
cpu_id
),
"tasks"
)
write_file
(
"{:d}
\
n
"
.
format
(
pid
),
cpu_tasks
,
mode
=
self
.
task_write_mode
)
# set the core to `cpu_mode`
# set the core to `cpu_mode`
scaling_governor_file
=
"/sys/devices/system/cpu/cpu{:d}/cpufreq/scaling_governor"
.
format
(
cpu_id
)
scaling_governor_file
=
"/sys/devices/system/cpu/cpu{:d}/cpufreq/scaling_governor"
.
format
(
cpu_id
)
if
os
.
path
.
exists
(
scaling_governor_file
):
if
os
.
path
.
exists
(
scaling_governor_file
):
...
@@ -216,5 +241,9 @@ def read_file(path, mode="rt"):
...
@@ -216,5 +241,9 @@ def read_file(path, mode="rt"):
def
write_file
(
content
,
path
,
mode
=
"wt"
):
def
write_file
(
content
,
path
,
mode
=
"wt"
):
try
:
with
open
(
path
,
mode
)
as
fo
:
with
open
(
path
,
mode
)
as
fo
:
fo
.
write
(
content
)
fo
.
write
(
content
)
except
IOError
as
e
:
logger
.
error
(
"Cannot write to {}"
.
format
(
path
))
raise
\ No newline at end of file
slapos/tests/slapformat.py
View file @
8bb366ab
...
@@ -744,31 +744,49 @@ class TestComputerWithCPUSet(SlapformatMixin):
...
@@ -744,31 +744,49 @@ class TestComputerWithCPUSet(SlapformatMixin):
self
.
assertEqual
(
self
.
computer
.
_manager_list
[
0
].
_cpu_id_list
(),
self
.
cpu_list
)
self
.
assertEqual
(
self
.
computer
.
_manager_list
[
0
].
_cpu_id_list
(),
self
.
cpu_list
)
# This should created per-cpu groups and move all tasks in CPU pool into cpu0
# This should created per-cpu groups and move all tasks in CPU pool into cpu0
self
.
computer
.
format
(
alter_network
=
False
,
alter_user
=
False
)
self
.
computer
.
format
(
alter_network
=
False
,
alter_user
=
False
)
# Test files creation for exclusive CPUs
# Test files creation for exclusive CPUs
for
cpu_id
in
self
.
cpu_list
:
# First half of CPUs is shared
cpu_n_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu"
+
str
(
cpu_id
))
shared_cpuset_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"shared"
)
for
cpu_id
in
self
.
cpu_list
[:
2
]:
self
.
assertFalse
(
os
.
path
.
exists
(
os
.
path
.
join
(
shared_cpuset_path
,
"cpu"
+
str
(
cpu_id
))),
"Specific cpu<N> doesn't make sense in shared cpuset."
)
# The second half of CPUs most be ready for exclusive
exclusive_cpuset_path
=
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
)
for
cpu_id
in
self
.
cpu_list
[
2
:]:
cpu_n_path
=
os
.
path
.
join
(
exclusive_cpuset_path
,
"cpu"
+
str
(
cpu_id
))
self
.
assertEqual
(
str
(
cpu_id
),
file_content
(
os
.
path
.
join
(
cpu_n_path
,
"cpuset.cpus"
)))
self
.
assertEqual
(
str
(
cpu_id
),
file_content
(
os
.
path
.
join
(
cpu_n_path
,
"cpuset.cpus"
)))
self
.
assertEqual
(
"1"
,
file_content
(
os
.
path
.
join
(
cpu_n_path
,
"cpuset.cpu_exclusive"
)))
self
.
assertEqual
(
"1"
,
file_content
(
os
.
path
.
join
(
cpu_n_path
,
"cpuset.cpu_exclusive"
)))
if
cpu_id
>
0
:
for
cpu_id
in
self
.
cpu_list
[:
2
]:
self
.
assertEqual
(
""
,
file_content
(
os
.
path
.
join
(
cpu_n_path
,
"tasks"
)))
self
.
assertFalse
(
os
.
path
.
exists
(
os
.
path
.
join
(
exclusive_cpuset_path
,
"cpu"
+
str
(
cpu_id
))),
"Shared CPU cannot appear in EXCLUSIVE set."
)
# Test moving tasks from generic core to private core
# Test moving tasks from generic core to private core
# request PID 1001 to be moved to its private CPU
# request PID 1001 to be moved to its private CPU
request_file_path
=
os
.
path
.
join
(
self
.
computer
.
partition_list
[
0
].
path
,
request_file_path
=
os
.
path
.
join
(
self
.
computer
.
partition_list
[
0
].
path
,
slapos
.
manager
.
cpuset
.
Manager
.
cpu_exclusive_file
)
slapos
.
manager
.
cpuset
.
Manager
.
cpu_exclusive_file
)
file_write
(
"1001
\
n
"
,
request_file_path
)
# ask exclusivity for existing and non-existing PID
file_write
(
"1001
\
n
9999
\
n
"
,
request_file_path
)
# Simulate slapos instance call to perform the actual movement
# Simulate slapos instance call to perform the actual movement
self
.
computer
.
_manager_list
[
0
].
instance
(
self
.
computer
.
_manager_list
[
0
].
instance
(
SlapGridPartitionMock
(
self
.
computer
.
partition_list
[
0
]))
SlapGridPartitionMock
(
self
.
computer
.
partition_list
[
0
]))
# Simulate cgroup behaviour - empty tasks in the pool
# Simulate cgroup behaviour - empty tasks in the pool
file_write
(
""
,
os
.
path
.
join
(
self
.
cpuset_path
,
"tasks"
))
file_write
(
""
,
os
.
path
.
join
(
self
.
cpuset_path
,
"tasks"
))
# Test that format moved all PIDs from CPU pool into CPU0
# Test that format moved all PIDs from CPU pool into shared pool
tasks_at_cpu0
=
file_content
(
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu0"
,
"tasks"
)).
split
()
shared_task_list
=
file_content
(
os
.
path
.
join
(
self
.
cpuset_path
,
"shared"
,
"tasks"
)).
split
()
self
.
assertIn
(
"1000"
,
tasks_at_cpu0
)
self
.
assertIn
(
"1000"
,
shared_task_list
)
self
.
assertIn
(
"1002"
,
shared_task_list
)
# test if the moving suceeded into any provate CPUS (id>0)
# test if the moving suceeded into any provate CPUS (id>0)
self
.
assertTrue
(
any
(
"1001"
in
file_content
(
exclusive_task
)
exclusive_tasks_path_list
=
[
for
exclusive_task
in
glob
.
glob
(
os
.
path
.
join
(
self
.
cpuset_path
,
"cpu[1-9]"
,
"tasks"
))))
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
,
"tasks"
),
self
.
assertIn
(
"1002"
,
tasks_at_cpu0
)
]
+
glob
.
glob
(
os
.
path
.
join
(
self
.
cpuset_path
,
"exclusive"
,
"cpu[1-9]"
,
"tasks"
))
self
.
assertTrue
(
any
(
"1001"
in
file_content
(
exclusive_tasks_path
)
for
exclusive_tasks_path
in
exclusive_tasks_path_list
))
self
.
assertFalse
(
any
(
"9999"
in
file_content
(
exclusive_tasks_path
)
for
exclusive_tasks_path
in
exclusive_tasks_path_list
))
# slapformat should remove successfully moved PIDs from the .slapos-cpu-exclusive file
# slapformat should remove successfully moved PIDs from the .slapos-cpu-exclusive file
self
.
assertEqual
(
""
,
file_content
(
request_file_path
).
strip
())
self
.
assertEqual
(
""
,
file_content
(
request_file_path
).
strip
())
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment