aboutsummaryrefslogtreecommitdiff
path: root/script/jepsen.garage/src/jepsen/garage/nemesis.clj
blob: 0222e46387d96ac00e254ddf53bec878a33568ee (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
(ns jepsen.garage.nemesis
  (:require [clojure.tools.logging :refer :all]
            [jepsen [control :as c]
             [core :as jepsen]
             [generator :as gen]
             [nemesis :as nemesis]]
            [jepsen.nemesis.combined :as combined]
            [jepsen.garage.daemon :as grg]
            [jepsen.control.util :as cu]))

; ---- reconfiguration nemesis ----

(defn configure-present!
  "Stage `nodes` as capacity-bearing members of the next cluster layout.

  Runs `grg/binary node id -q` on every node in `nodes`, keeps the first 16
  characters of each reported id, and then runs
  `grg/binary layout assign -c 1G <ids...>` on the primary node of `test`.
  The assignment is not applied here; `finalize-config!` does that.

  Returns the result of the `layout assign` command, or nil (running no
  remote command at all) when `nodes` is empty."
  [test nodes]
  (info "configure-present!" nodes)
  ; Without any node there is no id to pass, and `layout assign` would be
  ; invoked with no target at all, so skip the remote calls entirely.
  (when (seq nodes)
    (let [node-ids (c/on-many nodes (c/exec grg/binary :node :id :-q))
          ; Each entry destructures as a [key value] pair; only the value (the
          ; command output) is used, truncated to a 16-character id prefix.
          node-id-strs (map (fn [[_ v]] (subs v 0 16)) node-ids)]
      (c/on
        (jepsen/primary test)
        (apply c/exec grg/binary :layout :assign :-c :1G node-id-strs)))))

(defn configure-absent!
  "Stage `nodes` with the `-g` flag of `layout assign` in the next cluster
  layout, i.e. the role used here for nodes that are removed from the active
  set (NOTE(review): `-g` is Garage's gateway flag - confirm against the CLI).

  Runs `grg/binary node id -q` on every node in `nodes`, keeps the first 16
  characters of each reported id, and then runs
  `grg/binary layout assign -g <ids...>` on the primary node of `test`.
  The assignment is not applied here; `finalize-config!` does that.

  Returns the result of the `layout assign` command, or nil (running no
  remote command at all) when `nodes` is empty."
  [test nodes]
  (info "configure-absent!" nodes)
  ; `nodes` is empty when the caller keeps every node of the cluster; in that
  ; case `layout assign -g` would be invoked with no node id, so do nothing.
  (when (seq nodes)
    (let [node-ids (c/on-many nodes (c/exec grg/binary :node :id :-q))
          ; Each entry destructures as a [key value] pair; only the value (the
          ; command output) is used, truncated to a 16-character id prefix.
          node-id-strs (map (fn [[_ v]] (subs v 0 16)) node-ids)]
      (c/on
        (jepsen/primary test)
        (apply c/exec grg/binary :layout :assign :-g node-id-strs)))))

(defn finalize-config!
  "Apply whatever layout change is currently staged, if any.

  Runs `layout show` on the primary node of `test` and searches its output
  for an `apply --version <N>` line. When one is found, runs
  `layout apply --version <N>` on the primary node; otherwise only logs that
  there is nothing to apply."
  [test]
  (let [primary (jepsen/primary test)
        shown   (c/on primary (c/exec grg/binary :layout :show))]
    ; re-find yields [whole-match version] on success and nil otherwise, so
    ; `second` is nil exactly when no staged version was advertised.
    (if-let [version (second (re-find #"apply --version (\d+)\n" shown))]
      (do
        (info "layout show: " shown "; next-version: " version)
        (c/on primary
              (c/exec grg/binary :layout :apply :--version version)))
      (info "no layout changes to apply"))))

(defn reconfigure-subset
  "Build a nemesis that shrinks the cluster layout to `cnt` randomly chosen
  nodes and later restores it to all nodes.

  Handled ops, dispatched on `(:f op)`:
    :start  shuffles `(:nodes test)`, passes the first `cnt` nodes to
            `configure-present!` and the rest to `configure-absent!`, applies
            the layout with `finalize-config!`, and returns `op` with `:value`
            set to the kept nodes.
    :stop   passes every node to `configure-present!`, applies the layout,
            and returns `op` with `:value` set to `(:nodes test)`.

  There is no default clause, so any other `:f` makes `case` throw.
  `setup!` and `teardown!` do nothing and return the nemesis itself."
  [cnt]
  (reify nemesis/Nemesis
    (setup! [this test] this)

    (invoke! [this test op]
      (case (:f op)
        :start
          (let [[keep-nodes remove-nodes]
                (->> (:nodes test)
                     shuffle
                     (split-at cnt))]
            (info "layout split: keep " keep-nodes ", remove " remove-nodes)
            (configure-present! test keep-nodes)
            (configure-absent! test remove-nodes)
            (finalize-config! test)
            (assoc op :value keep-nodes))
        :stop
          (do
            (info "layout un-split: all nodes=" (:nodes test))
            (configure-present! test (:nodes test))
            (finalize-config! test)
            (assoc op :value (:nodes test)))))

    (teardown! [this test] this)))

; ---- nemesis scenarios ----

(defn nemesis-op
  "Build a generator function for a single nemesis operation.

  The returned function takes exactly two arguments, ignores both, and always
  yields the op map `{:type :info, :f op}`."
  [op]
  (let [operation {:type :info, :f op}]
    ; Keep the two-argument shape of the function: only its arity matters,
    ; the arguments themselves are never read.
    (fn [_first _second] operation)))

(defn reconfiguration-package
  "Cluster reconfiguration nemesis package.

  Returns a map with:
    :generator        a random mix of `:reconfigure-start` and
                      `:reconfigure-stop` ops, staggered by `(:interval opts)`
                      (default 5)
    :final-generator  a single `:reconfigure-stop` op
    :nemesis          a `reconfigure-subset` nemesis keeping 3 nodes, composed
                      so that `:reconfigure-start` / `:reconfigure-stop` reach
                      it as `:start` / `:stop`
    :perf             the description used to plot reconfiguration periods"
  [opts]
  {:generator        (->>
                       (gen/mix [(nemesis-op :reconfigure-start)
                                 (nemesis-op :reconfigure-stop)])
                       (gen/stagger (:interval opts 5)))
   :final-generator  {:type :info, :f :reconfigure-stop}
   :nemesis          (nemesis/compose
                       {{:reconfigure-start :start
                         :reconfigure-stop :stop} (reconfigure-subset 3)})
   ; The :stop set must name the op this package's generator actually emits
   ; (:reconfigure-stop); a misspelt keyword here would never match it.
   :perf              #{{:name  "reconfigure"
                         :start #{:reconfigure-start}
                         :stop  #{:reconfigure-stop}
                         :color "#A197E9"}}})

(defn scenario-c
  "Scenario with clock faults only: a single `combined/clock-package` built
  with the db from `opts`, an interval of 1 and the `:clock` fault."
  [opts]
  (let [clock-opts {:db (:db opts), :interval 1, :faults #{:clock}}]
    (combined/clock-package clock-opts)))

(defn scenario-cp
  "Scenario composing a clock package and a partition package, each built
  with the db from `opts` and an interval of 1."
  [opts]
  (let [clock-pkg     (combined/clock-package
                        {:db (:db opts), :interval 1, :faults #{:clock}})
        partition-pkg (combined/partition-package
                        {:db (:db opts), :interval 1, :faults #{:partition}})]
    (combined/compose-packages [clock-pkg partition-pkg])))

(defn scenario-r
  "Scenario with cluster reconfiguration only: a `reconfiguration-package`
  with an interval of 1. `opts` is accepted but not used."
  [opts]
  (let [package-opts {:interval 1}]
    (reconfiguration-package package-opts)))

(defn scenario-pr
  "Scenario composing a partition package (db from `opts`, interval 1) with a
  cluster reconfiguration package (interval 1)."
  [opts]
  (let [partition-pkg   (combined/partition-package
                          {:db (:db opts), :interval 1, :faults #{:partition}})
        reconfigure-pkg (reconfiguration-package {:interval 1})]
    (combined/compose-packages [partition-pkg reconfigure-pkg])))

(defn scenario-cpr
  "Scenario composing a clock package, a partition package (both with the db
  from `opts`) and a cluster reconfiguration package, all with interval 1."
  [opts]
  (let [clock-pkg       (combined/clock-package
                          {:db (:db opts), :interval 1, :faults #{:clock}})
        partition-pkg   (combined/partition-package
                          {:db (:db opts), :interval 1, :faults #{:partition}})
        reconfigure-pkg (reconfiguration-package {:interval 1})]
    (combined/compose-packages [clock-pkg partition-pkg reconfigure-pkg])))

(defn scenario-dpr
  "Scenario composing a db package (faults `:db`, `:pause`, `:kill`), a
  partition package (both with the db from `opts`) and a cluster
  reconfiguration package, all with interval 1."
  [opts]
  (let [db-pkg          (combined/db-package
                          {:db (:db opts), :interval 1, :faults #{:db :pause :kill}})
        partition-pkg   (combined/partition-package
                          {:db (:db opts), :interval 1, :faults #{:partition}})
        reconfigure-pkg (reconfiguration-package {:interval 1})]
    (combined/compose-packages [db-pkg partition-pkg reconfigure-pkg])))