summaryrefslogtreecommitdiffstats
path: root/qa/standalone/mgr/balancer.sh
blob: 7e87cbf4a5f369d8cc1bf8fd1eb2d9b882f26b8c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
#!/usr/bin/env bash
#
# Copyright (C) 2019 Red Hat <contact@redhat.com>
#
# Author: David Zafman <dzafman@redhat.com>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU Library Public License as published by
# the Free Software Foundation; either version 2, or (at your option)
# any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Library Public License for more details.
#
source $CEPH_ROOT/qa/standalone/ceph-helpers.sh

# Export the monitor address and common daemon arguments, then run the
# requested test functions one after another.
#
# Arguments:
#   $1   - directory passed as the only argument to every test function
#   $2.. - optional names of the test functions to run; when none are given,
#          every function known to the current shell whose name matches
#          TEST_[0-9a-z_]* (as listed by `set`) is run
# Globals:
#   CEPH_MON  - set and exported
#   CEPH_ARGS - exported and appended to (fsid, auth and mon-host options)
# Returns:
#   0 when every test function succeeds, 1 as soon as one of them fails
function run() {
    local dir=$1
    shift

    export CEPH_MON="127.0.0.1:7102" # git grep '\<7102\>' : there must be only one
    export CEPH_ARGS
    CEPH_ARGS+="--fsid=$(uuidgen) --auth-supported=none "
    CEPH_ARGS+="--mon-host=$CEPH_MON "

    # The list is kept as a whitespace-separated string on purpose: the
    # auto-discovered names arrive one per line and are split by the loop below.
    local funcs=${@:-$(set | sed -n -e 's/^\(TEST_[0-9a-z_]*\) .*/\1/p')}
    local func
    for func in $funcs ; do
        # Quote the directory so it always reaches the test as one argument.
        "$func" "$dir" || return 1
    done
}

# Names of the two pools created by the test functions in this file.
TEST_POOL1="test1"
TEST_POOL2="test2"

# Exercise the `ceph balancer` command-line interface on a small cluster
# (one mon, one mgr, three OSDs, two pools): initial status, plan listing,
# evaluation, per-pool selection, and the crush-compat and upmap modes
# including switching the automatic balancer on and off.
#
# Arguments:
#   $1 - directory handed to setup/run_*/teardown
# Globals:
#   TEST_POOL1, TEST_POOL2 (read)
# Returns:
#   0 when every step and every check succeeds, 1 otherwise
function TEST_balancer() {
    local dir=$1
    local mode active plans score pool result
    local osd

    setup "$dir" || return 1
    run_mon "$dir" a || return 1
    run_mgr "$dir" x || return 1
    for osd in 0 1 2 ; do
        run_osd "$dir" $osd || return 1
    done
    create_pool "$TEST_POOL1" 8 || return 1
    create_pool "$TEST_POOL2" 8 || return 1

    wait_for_clean || return 1

    # Diagnostic output only; its status is deliberately not checked.
    ceph pg dump pgs
    ceph osd set-require-min-compat-client luminous || return 1

    # A fresh cluster is expected to report mode "none" and an inactive balancer.
    ceph balancer status || return 1
    # jq -r prints the bare string, so no eval is needed to strip JSON quotes.
    mode=$(ceph balancer status | jq -r '.mode')
    test "$mode" = "none" || return 1
    active=$(ceph balancer status | jq -r '.active')
    test "$active" = "false" || return 1

    # No plans exist yet and the cluster score is expected to be zero.
    ceph balancer ls || return 1
    plans=$(ceph balancer ls)
    test "$plans" = "[]" || return 1
    ceph balancer eval || return 1
    score="$(ceph balancer eval)"
    test "$score" = "current cluster score 0.000000 (lower is better)" || return 1
    ceph balancer eval-verbose || return 1

    # Pools can be added to and removed from the balancer's pool list.
    ceph balancer pool add "$TEST_POOL1" || return 1
    ceph balancer pool add "$TEST_POOL2" || return 1
    ceph balancer pool ls || return 1
    pool=$(ceph balancer pool ls | jq -r 'sort | .[0]')
    test "$pool" = "$TEST_POOL1" || return 1
    pool=$(ceph balancer pool ls | jq -r 'sort | .[1]')
    test "$pool" = "$TEST_POOL2" || return 1
    ceph balancer pool rm "$TEST_POOL1" || return 1
    ceph balancer pool rm "$TEST_POOL2" || return 1
    ceph balancer pool ls || return 1
    ceph balancer pool add "$TEST_POOL1" || return 1

    # crush-compat mode: optimize is expected to FAIL because there is
    # nothing to improve; the reason is then read back from the status.
    ceph balancer mode crush-compat || return 1
    ceph balancer status || return 1
    mode=$(ceph balancer status | jq -r '.mode')
    test "$mode" = "crush-compat" || return 1
    if ceph balancer optimize plan_crush "$TEST_POOL1" ; then
        return 1
    fi
    ceph balancer status || return 1
    result=$(ceph balancer status | jq -r '.optimize_result')
    test "$result" = "Distribution is already perfect" || return 1

    ceph balancer on || return 1
    active=$(ceph balancer status | jq -r '.active')
    test "$active" = "true" || return 1
    sleep 2
    ceph balancer status || return 1
    ceph balancer off || return 1
    active=$(ceph balancer status | jq -r '.active')
    test "$active" = "false" || return 1
    sleep 2

    ceph balancer reset || return 1

    # upmap mode: same sequence, with the upmap-specific "nothing to do" text.
    ceph balancer mode upmap || return 1
    ceph balancer status || return 1
    mode=$(ceph balancer status | jq -r '.mode')
    test "$mode" = "upmap" || return 1
    if ceph balancer optimize plan_upmap "$TEST_POOL1" ; then
        return 1
    fi
    ceph balancer status || return 1
    result=$(ceph balancer status | jq -r '.optimize_result')
    test "$result" = "Unable to find further optimization, or pool(s) pg_num is decreasing, or distribution is already perfect" || return 1

    ceph balancer on || return 1
    active=$(ceph balancer status | jq -r '.active')
    test "$active" = "true" || return 1
    sleep 2
    ceph balancer status || return 1
    ceph balancer off || return 1
    active=$(ceph balancer status | jq -r '.active')
    test "$active" = "false" || return 1

    teardown "$dir" || return 1
}

# Helper for TEST_balancer2. (The name intentionally does not start with
# TEST_, so run() does not pick it up as a test of its own.)
# Poll a log file every 5 seconds, at most 25 times (about 2 minutes), until
# it contains at least the wanted number of lines matching
# "Optimization plan is almost perfect".
#
# Arguments:
#   $1 - path of the log file to search
#   $2 - minimum number of matching lines required
# Returns:
#   0 once the threshold is reached, 1 if it is never reached
function _balancer2_wait_for_plans() {
    local log=$1
    local wanted=$2
    local attempt found

    for attempt in $(seq 1 25) ; do
        sleep 5
        # grep -c prints nothing when the file is missing; treat that as 0.
        found=$(grep -c "Optimization plan is almost perfect" "$log" 2>/dev/null)
        if test "${found:-0}" -ge "$wanted" ; then
            return 0
        fi
    done
    return 1
}

# Helper for TEST_balancer2.
# Take one `ceph osd df` JSON snapshot and verify the .pgs value of the
# first N entries of .nodes[] against a lower and an optional upper bound.
#
# Arguments:
#   $1 - number of entries (OSDs) to check
#   $2 - minimum acceptable PG count
#   $3 - maximum acceptable PG count (optional; no upper bound when empty)
# Returns:
#   0 when every entry is within bounds, 1 otherwise (including when an
#   entry is missing or not a number)
function _balancer2_check_pgs() {
    local osds=$1
    local min=$2
    local max=$3
    local df_json pgs i

    df_json=$(ceph osd df --format=json-pretty) || return 1
    for (( i = 0; i < osds; i++ )) ; do
        pgs=$(jq ".nodes[$i].pgs" <<< "$df_json")
        # A missing entry yields "null" or nothing, which must be a failure.
        [[ "$pgs" =~ ^[0-9]+$ ]] || return 1
        test "$pgs" -ge "$min" || return 1
        if test -n "$max" ; then
            test "$pgs" -le "$max" || return 1
        fi
    done
    return 0
}

# Check that the automatic upmap balancer evens out PG counts across OSDs:
# first with a single pool, then again after a second pool is created.
#
# Arguments:
#   $1 - directory handed to setup/run_*/teardown; the mgr log is read
#        from $1/mgr.x.log
# Globals:
#   TEST_POOL1, TEST_POOL2 (read); CEPH_ARGS (appended to)
# Returns:
#   0 when every step and every check succeeds, 1 otherwise
function TEST_balancer2() {
    local dir=$1
    local pgs1=118
    local pgs2=132
    local osds=5
    local replicas=3
    # Integer average of PGs per OSD for the first pool (70.8 -> 70),
    # so each OSD must hold at least this many
    local per_osd1=$(( pgs1 * replicas / osds ))
    # Integer average of PGs per OSD with both pools (150)
    local per_osd2=$(( (pgs1 + pgs2) * replicas / osds ))
    local i

    CEPH_ARGS+="--osd_pool_default_pg_autoscale_mode=off "
    CEPH_ARGS+="--debug_osd=20 "
    setup "$dir" || return 1
    run_mon "$dir" a || return 1
    run_mgr "$dir" x || return 1
    for (( i = 0; i < osds; i++ )) ; do
        run_osd "$dir" $i || return 1
    done

    ceph osd set-require-min-compat-client luminous || return 1
    ceph config set mgr mgr/balancer/upmap_max_deviation 1 || return 1
    ceph balancer mode upmap || return 1
    ceph balancer on || return 1
    ceph config set mgr mgr/balancer/sleep_interval 5 || return 1

    create_pool "$TEST_POOL1" $pgs1 || return 1

    wait_for_clean || return 1

    # Wait (up to about 2 minutes) for the first plan to be logged
    _balancer2_wait_for_plans "$dir/mgr.x.log" 1 || return 1
    # Plan is found, but PGs still need to move
    sleep 30
    ceph osd df

    _balancer2_check_pgs $osds $per_osd1 || return 1

    create_pool "$TEST_POOL2" $pgs2 || return 1

    # Wait for a second plan. "At least 2" rather than "exactly 2" so the
    # check cannot be missed if the count moves past 2 between two polls.
    _balancer2_wait_for_plans "$dir/mgr.x.log" 2 || return 1
    # Plan is found, but PGs still need to move
    sleep 30
    ceph osd df

    # We should be within plus or minus 1 of per_osd2.
    # This is because here each pool is balanced independently.
    _balancer2_check_pgs $osds $(( per_osd2 - 1 )) $(( per_osd2 + 1 )) || return 1

    teardown "$dir" || return 1
}

# Script entry point: call `main` with the suite name "balancer" followed by
# the script's own command-line arguments. `main` is not defined in this
# file; presumably it comes from the ceph-helpers.sh sourced at the top and
# in turn invokes run() above -- confirm against that helper.
main balancer "$@"

# Local Variables:
# compile-command: "make -j4 && ../qa/run-standalone.sh balancer.sh"
# End: