commit b3b27ed008a7813fa03f45f3e9f02aa3b68a450c · pyrox.dev/nixpkgs

+46 -4
nixos/tests/consul.nix
···

       145
       145
        
           client2.succeed("[ $(consul kv get testkey) == 42 ]")

     

       146
       146
        
       

     

       147
       147
        
       

     

       148
       148
       -
           def rolling_reboot_test():

     

       148
       148
       +
           def rolling_reboot_test(proper_rolling_procedure=True):

     

       149
       149
        
               """

     

       150
       150
        
               Tests that the cluster can tolerate failures of any single server,

     

       151
       151
        
               following the recommended rolling upgrade procedure from

     

       152
       152
       -
               https://www.consul.io/docs/upgrading#standard-upgrades

     

       152
       152
       +
               https://www.consul.io/docs/upgrading#standard-upgrades.

     

       153
       153
       +
       

     

       154
       154
       +
               Optionally, `proper_rolling_procedure=False` can be given

     

       155
       155
       +
               to wait only for each server to be back `Healthy`, not `Stable`

     

       156
       156
       +
               in the Raft consensus, see Consul setting `ServerStabilizationTime` and

     

       157
       157
       +
               https://github.com/hashicorp/consul/issues/8118#issuecomment-645330040.

     

       153
       158
        
               """

     

       154
       159
        
       

     

       155
       160
        
               for server in servers:

     
···

       168
       173
        
                   # Restart crashed machine.

     

       169
       174
        
                   server.start()

     

       170
       175
        
       

     

       171
       171
       -
                   # Wait for recovery.

     

       172
       172
       -
                   wait_for_healthy_servers()

     

       176
       176
       +
                   if proper_rolling_procedure:

     

       177
       177
       +
                       # Wait for recovery.

     

       178
       178
       +
                       wait_for_healthy_servers()

     

       179
       179
       +
                   else:

     

       180
       180
       +
                       # NOT proper rolling upgrade procedure, see above.

     

       181
       181
       +
                       wait_for_all_machines_alive()

     

       173
       182
        
       

     

       174
       183
        
                   # Wait for client connections.

     

       175
       184
        
                   client1.wait_until_succeeds("consul kv get -recurse")

     
···

       181
       190
        
                   client2.succeed("consul kv delete testkey")

     

       182
       191
        
       

     

       183
       192
        
       

     

       193
       193
       +
           def all_servers_crash_simultaneously_test():

     

       194
       194
       +
               """

     

       195
       195
       +
               Tests that the cluster will eventually come back after all

     

       196
       196
       +
               servers crash simultaneously.

     

       197
       197
       +
               """

     

       198
       198
       +
       

     

       199
       199
       +
               for server in servers:

     

       200
       200
       +
                   server.crash()

     

       201
       201
       +
       

     

       202
       202
       +
               for server in servers:

     

       203
       203
       +
                   server.start()

     

       204
       204
       +
       

     

       205
       205
       +
               # Wait for recovery.

     

       206
       206
       +
               wait_for_healthy_servers()

     

       207
       207
       +
       

     

       208
       208
       +
               # Wait for client connections.

     

       209
       209
       +
               client1.wait_until_succeeds("consul kv get -recurse")

     

       210
       210
       +
               client2.wait_until_succeeds("consul kv get -recurse")

     

       211
       211
       +
       

     

       212
       212
       +
               # Do some consul actions with servers back up.

     

       213
       213
       +
               client1.succeed("consul kv put testkey 44")

     

       214
       214
       +
               client2.succeed("[ $(consul kv get testkey) == 44 ]")

     

       215
       215
       +
               client2.succeed("consul kv delete testkey")

     

       216
       216
       +
       

     

       217
       217
       +
       

     

       184
       218
        
           # Run the tests.

     

       219
       219
       +
       

     

       220
       220
       +
           print("rolling_reboot_test()")

     

       185
       221
        
           rolling_reboot_test()

     

       222
       222
       +
       

     

       223
       223
       +
           print("all_servers_crash_simultaneously_test()")

     

       224
       224
       +
           all_servers_crash_simultaneously_test()

     

       225
       225
       +
       

     

       226
       226
       +
           print("rolling_reboot_test(proper_rolling_procedure=False)")

     

       227
       227
       +
           rolling_reboot_test(proper_rolling_procedure=False)

     

       186
       228
        
         '';

     

       187
       229
        
       })