wireguard.m4


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341

dnl // Tamarin uses ' which is an m4 close quote. So use <! !> for quoting instead.
changequote(<!,!>)
changecom(<!@,@!>)
/*
 * Protocol:    Wireguard protocol
 * Modeler:     Kevin Milner & Jason Donenfeld
 * Date:        2017
 * Source:      Original
 * Status:      Basically complete? Use the 'i' heuristic to autoprove.
 *
 * TODO:
 * - Implement identity hiding using observational equivalence, instead of the weaker surrogate-based property.
 * - Prove indistinguishability using observational equivalence.
 * - Model ECDH(private, NULL) = NULL
 */

theory WireGuard
begin

builtins: hashing, diffie-hellman
/* Normally an aead would be arity 4, but in the handshake the nonce is always
 * the fixed value 0 so for legibility we do not include it */
functions: aead/3, decrypt/2, verify/3, true/0
/* The plaintext can be recovered with the key */
equations: decrypt(aead(k, p, a), k) = p
/* The authentication can be checked with the key and AAD */
equations: verify(aead(k, p, a), a, k) = true

/* This restriction tells Tamarin that whenever an Eq( ) fact occurs,
 * the terms in it must be equal. This allows us to model rules that
 * only trigger if e.g. the AEAD correctly verifies */
restriction Eq_testing: "All x y #i. Eq(x, y) @ i ==> x = y"

/* === m4 Definitions ===
 * These are mostly used to influence Tamarin's heuristics. They can be
 * commented out by prefixing them with 'dnl'. 
 */

/* Uncomment these to prevent any adversary message modifications,
 * useful for checking exists-trace lemmas and making sure messsages
 * don't require the adversary to reorder terms etc. */
dnl define(In, AuthenticatedMessage($*))
dnl define(Out, AuthenticatedMessage($*))

/* These defines are for the heuristic goal sorting. F_ indicates that the
 * heuristic should prioritize solving it, which we use to solve for where
 * agents got various constraints (like the keys, and key relationships) */
define(AgentKey, F_AgentKey($*))
define(AgentPSK, F_AgentPSK($*))
define(StateInvariants, F_StateInvariants($*))

/* L_ indicates the heuristic should deprioritize solving the goal. In this
 * case, typically agent state can come from just about anywhere so it creates
 * a ton of case distinctions when we're usually only interested in the current
 * session anyway. */
define(State, L_State($*))

/* === Setup and key reveal rules === */

/* Keygen is separate from pairing to allow keys to be paired
 * more than once (if they were generated fresh in the pairing
 * this would not be possible */
rule AgentKeyGen:
    [ Fr(~ltk) ]
    --[DHKey(~ltk)]->
    [!AgentKey(~ltk), Out('g'^~ltk)]

/* Semi-malicious or ignorant agents might share a PSK with multiple
 * parties, so we overapproximate this by allowing the same PSK to be reused
 * arbitrarily. If this finds an attack then it may not be a 'real'
 * attack, but if it doesn't then there is no problem with PSK reuse. */
rule PSKKeyGen:
    [ Fr(~psk) ]
    --[PSKey(~psk)]->
    [ !AgentPSK(~psk) ]

/* Key Reveals for our adversary model. These allow the adversary to reveal
 * any of the keys below at any time, unless restricted in the lemma we wish
 * to prove. */
rule PSK_reveal: 
   [ !AgentPSK(k) ] --[ Reveal_PSK(k) ]-> [ Out(k) ]

rule AgentKey_reveal:
   [ !AgentKey(k) ] --[ Reveal_AK('g'^k) ]-> [ Out(k) ]

rule EphKey_reveal:
   [ !EphKeytoReveal(k) ] --[ Reveal_EphK('g'^k) ]-> [ Out(k) ]

/* Models an agent adding anothers public key out-of-band, we assume that
 * all relationships set up this way are 'sane' and both of the keys involved
 * were generated fresh. */
rule AddPublicKey:
    let pkB = 'g'^~ltkB in
    [ !AgentKey(~ltkA)
    , !AgentKey(~ltkB)
    , !AgentPSK(~psk)
    , Fr(~id)
    ]-->
    [ /* For search efficiency, state is divided into
       * an invariant portion and a variant portion. This
       * allows tamarin to immediately bind the keys back
       * to this initial pairing rule. The fresh ~id is used
       * to identify this pairing. We cache the SiSr in the
       * invariant to reduce Tamarin's variant precomputation time. */
      State(~id, 'no_message_state')
    , !StateInvariants(~id, ~psk, ~ltkA, pkB, pkB^~ltkA)
    ]

/* === Message Rules === */

rule Handshake_Init:
    let pkI   = 'g'^~ltkI
        pekI  = 'g'^~ekI
        eisr  = pkR^~ekI
        /* Constructing the init message m1: */
        cii   = h('noise')
        hii   = h(<cii, 'id', pkR, pekI>)
        ci0   = h(<cii, pekI, '1'>)
        ci1   = h(<ci0, eisr, '1'>)
        ki1   = h(<ci0, eisr, '2'>)
        astat = aead(ki1, <pkI, ~pkISurrogate>, hii)
        hi0   = h(<hii, astat>)
        ci2   = h(<ci1, sisr, '1'>)
        ki2   = h(<ci1, sisr, '2'>)
        ats   = aead(ki2, $ts, hi0)
        hi1   = h(<hi0, ats>)
        /* NOTE: MACs used in the DDoS protection are not modeled, so we assume they are
         * some arbitrary public values (i.e. known to the adversary, like a fixed string). */
        m1    = <'1', ~sidI, pekI, astat, ats, $mac1, $mac2> in
    [ /* Init can be triggered at any time, even when currently performing
       * another role or on another stage. This could happen e.g. because of a timeout.
       * As such we bind the previous state as 'anything' and discard it. */
      State(~id, anything)
    , !StateInvariants(~id, ~psk, ~ltkI, pkR, sisr)
    , Fr(~sidI)
    , Fr(~ekI)
    /* The pkISurrogate is used later to approximate identity hiding. */
    , Fr(~pkISurrogate)
    ]-->
    [ State(~id, <'init', ~sidI, ~ekI, ci2, ki2, hi1>)
      /* F_SolveInit is a bit of a hack to help with Tamarin's heuristics. It allows Tamarin to
       * prioritize solving backwards from the Handshake_Complete rule even though the State
       * fact is deprioritized by the m4 definitions above. This will not be necessary in a
       * future version of Tamarin. */
    , F_SolveInit(~id, ~psk, <'init', ~sidI, ~ekI, ci2, ki2, hi1>)
    , !EphKeytoReveal(~ekI)
    , Out(m1)
    ]

rule Handshake_Resp:
    let pkR   = 'g'^~ltkR
        pekR  = 'g'^~ekR
        eisr  = pekI^~ltkR
        eier  = pekI^~ekR
        sier  = pkI^~ekR
        /* Reconstructing what should be in m1: */
        cri   = h('noise')
        hri   = h(<cri, 'id', pkR, pekI>)
        cr0   = h(<cri, pekI, '1'>)
        cr1   = h(<cr0, eisr, '1'>)
        kr1   = h(<cr0, eisr, '2'>)
        astat = aead(kr1, <pkI, pkISurrogate>, hri)
        hr0   = h(<hri, astat>)
        cr2   = h(<cr1, sisr, '1'>)
        kr2   = h(<cr1, sisr, '2'>)
        ats   = aead(kr2, $ts, hr0)
        hr1   = h(<hr0, ats>)
        m1    = <'1', sidI, pekI, astat, ats, $mac1, $mac2> /* NOTE: MACs used in DDoS protection are not modeled. */
        /* Constructing the response message m2: */
        cr3   = h(<cr2, pekR, '1'>)
        hr2   = h(<hr1, pekR>)
        cr4   = h(<cr3, eier, '1'>)
        cr5   = h(<cr4, sier, '1'>)
        cr6   = h(<cr5, ~psk, '1'>)
        hrt   = h(<cr5, ~psk, '2'>)
        kr6   = h(<cr5, ~psk, '3'>)
        hr3   = h(<hr2, hrt>)
        aempt = aead(kr6, 'e', hr3)
        hr4   = h(<hr3, aempt>)
        m2    = <'2', sidI, ~sidR, pekR, aempt, $mac1, $mac2> in /* NOTE: MACs used in DDoS protection are not modeled. */
    [ State(~id, anything)
    , !StateInvariants(~id, ~psk, ~ltkR, pkI, sisr)
    , Fr(~ekR)
    , Fr(~sidR)
    , In(m1)
    ]--[
        /* In the real protocol, this isn't actually cr6, but is rather derived from it
         * via some more hashing, but it doesn't make a difference here -- if the adversary knows cr6,
         * it can compute the derived key. */
        RKeys(<pkI, pkR, pekI, pekR, ~psk, cr6>)
      , Identity_Surrogate(pkISurrogate)
    ]->
    [ State(~id, <'transport_unconfirmed', ~sidR, pekI, pekR, cr6>)
    , F_SolveResp(~id, ~psk, <'transport_unconfirmed', ~sidR, pekI, pekR, cr6>) /* This is used for the same purpose as F_SolveInit above */
    , !EphKeytoReveal(~ekR)
    , Out(m2)
    ]

rule Handshake_Complete:
    let pkI   = 'g'^~ltkI
        pekI  = 'g'^~ekI
        eier  = pekR^~ekI
        sier  = pekR^~ltkI
        /* Reconstruct what should be in m2: */
        ci3   = h(<ci2, pekR, '1'>)
        hi2   = h(<hi1, pekR>)
        ci4   = h(<ci3, eier, '1'>)
        ci5   = h(<ci4, sier, '1'>)
        ci6   = h(<ci5, ~psk, '1'>)
        hit   = h(<ci5, ~psk, '2'>)
        ki6   = h(<ci5, ~psk, '3'>)
        hi3   = h(<hi2, hit>)
        aempt = aead(ki6, 'e', hi3)
        hi4   = h(<hi3, aempt>)
        m2    = <'2', sidI, sidR, pekR, aempt, $mac1, $mac2>
        /* We assume the first transport message is 'as weak as possible', that is, all values
         * in it are public other than the key used to encrypt. */
        mtr   = <'4', sidR, aead(ci6, 'message', '0')> in
    [ State(~id, <'init', sidI, ~ekI, ci2, ki2, hi1>)
    , F_SolveInit(~id, ~psk, <'init', sidI, ~ekI, ci2, ki2, hi1>)
    , !StateInvariants(~id, ~psk, ~ltkI, pkR, sisr)
    , In(m2)
    ]--[
      /* In the real protocol, this isn't actually ci6, but is rather derived from it
       * via some more hashing, but it doesn't make a difference here (as with cr6 above). */
      IKeys(<pkI, pkR, pekI, pekR, ~psk, ci6>)
    ]->
    [ State(~id, <'transport', sidI, ci6>)
    , Out(mtr)
    ]

/* === Key Confirmation ===
 *
 * For proving agreement properties after the first transport message
 * This is not faithfully modelled, since we don't care about the contents
 * of the transport message--instead it's generically 'anything encrypted
 * with the transport key I just set up'. */

rule R_ConfirmedTransportMessage:
    let mtr = <'4', sid, data> in
    [ State(~id, <'transport_unconfirmed', sidR, pekI, pekR, cr>)
    , F_SolveResp(~id, ~psk, <'transport_unconfirmed', sidR, pekI, pekR, cr>)
    , !StateInvariants(~id, ~psk, ~ltkR, pkI, sisr)
    , In(mtr)
    ]--[
      RConfirm(<pkI, 'g'^~ltkR, pekI, pekR, ~psk, cr>)
      //We manually verify this instead of the recomputation used for other terms above, since
      //morally R may not know the contents of the message.
    , Eq(verify(data, '0', cr), true)
    ]->
    [ State(~id, <'transport', sidR, cr>) ]
    
/* === Session Traces ===
 *
 * We show that at least the protocol works. */

lemma exists_session: exists-trace
    "Ex pki pkr peki pekr psk ck #i #j.
        IKeys(<pki, pkr, peki, pekr, psk, ck>) @ i
        & RConfirm(<pki, pkr, peki, pekr, psk, ck>) @ j & #i < #j"

/* There are only three numbers, 0, 1, and infinity. So 2 == infinity */
lemma exists_two_sessions: exists-trace
    "Ex pki pkr sesskeys sesskeys2 #i #j #i2 #j2.
        IKeys(<pki, pkr, sesskeys>) @ i
        & RConfirm(<pki, pkr, sesskeys>) @ j & #i < #j
        & IKeys(<pki, pkr, sesskeys2>) @ i2 & RConfirm(<pki, pkr, sesskeys2>) @ j2 & #i2 < #j2
        & #i < #i2 & not(sesskeys = sesskeys2)"


/* === Agreement Properties === */

lemma I_disagreement_implies_Sr_or_SiEi_compromise_and_PSK_compromise[reuse]:
    "All pki pkr peki pekr psk ck #i.
        /* If I believes they have completed a handshake with R */
        IKeys(<pki, pkr, peki, pekr, psk, ck>) @ i
        /* but R doesn't have a matching session */
        & not(Ex #j. #j < #i & RKeys(<pki, pkr, peki, pekr, psk, ck>) @ j)
    ==> /* Then the PSK was compromised (or not in use) and */
        (Ex #j. Reveal_PSK(psk) @ j & #j < #i) & (
        /* either R's static was compromised */
        (Ex #j. Reveal_AK(pkr) @ j & #j < #i)
        /* or both I's static and ephemeral were already compromised */
        | (Ex #j #j2. Reveal_AK(pki) @ j & #j < #i & Reveal_EphK(peki) @ j2 & #j2 < #i)
        )"

lemma R_disagreement_implies_Si_or_SrEr_compromise_and_PSK_compromise[reuse]:
    "All pki pkr peki pekr psk ck #i.
        /* If R believes they have a confirmed session with I */
        RConfirm(<pki, pkr, peki, pekr, psk, ck>) @ i
        /* but I doesn't have a matching session */
        & not(Ex #j. #j < #i & IKeys(<pki, pkr, peki, pekr, psk, ck>) @ j)
    ==> /* Then the PSK was compromised (or not in use) and */
        (Ex #j. Reveal_PSK(psk) @ j & #j < #i) & (
        /* either I's static was compromised */
        (Ex #j. Reveal_AK(pki) @ j & #j < #i)
        /* or both R's static and ephemeral were already compromised */
        | (Ex #j #j2. Reveal_AK(pkr) @ j & Reveal_EphK(pekr) @ j2 & #j2 < #i & #j < #i)
        )"

lemma session_uniqueness:
    /* For both I and R, a 'confirmed session key' will always be unique (even if all keys are compromised)
     * This follows from I and R generating random ephemeral values. Note that this could be violated if the
     * RNG can be controlled instead of just revealed, which we do not model. */
    "(All pki pkr peki pekr psk ck #i.
        IKeys(<pki, pkr, peki, pekr, psk, ck>) @ i
    ==> not(Ex peki2 pekr2 #k. IKeys(<pki, pkr, peki2, pekr2, psk, ck>) @ k & not(#k = #i)))
    &(All pki pkr peki pekr psk ck #i.
        RConfirm(<pki, pkr, peki, pekr, psk, ck>) @ i
    ==> not(Ex peki2 pekr2 psk2 #k. RConfirm(<pki, pkr, peki2, pekr2, psk2, ck>) @ k & not(#k = #i)))"

/* === Secrecy Properties === */

lemma key_secrecy[reuse]:
    "(All pki pkr peki pekr psk ck #i #i2.
        /* If I and R agree on keys */
        IKeys(<pki, pkr, peki, pekr, psk, ck>) @ i & RKeys(<pki, pkr, peki, pekr, psk, ck>) @ i2
    ==> /* Either the adversary doesn't know the keys */
        not(Ex #j. K(ck) @ j) 
        /* or the psk was compromised (or not in use) */
        | ((Ex #j. Reveal_PSK(psk) @ j) & (
           /* and pair of keys from the same agent was revealed (at any time) */
           (Ex #j #j2. Reveal_AK(pki) @ j & Reveal_EphK(peki) @ j2)
         | (Ex #j #j2. Reveal_AK(pkr) @ j & Reveal_EphK(pekr) @ j2))
        ))"

lemma identity_hiding:
    /* Since the public static is always symbolically known to the adversary, we represent identity
     * hiding by whether the adversary could learn some other value that is put in the first message at the
     * same position as the public static. */
    "All pki pkr peki pekr ck surrogate #i #j.
        /* If R received a handshake init with a particular identity surrogate */
        RKeys(<pki, pkr, peki, pekr, ck>) @ i & Identity_Surrogate(surrogate) @ i
        /* And the adversary knows that surrogate for the identity */
        & K(surrogate) @ j
    ==> /* Then the adversary compromised at least one of R's static, I's static, or I's ephemeral */
        (Ex #j. Reveal_AK(pkr) @ j) | (Ex #j. Reveal_AK(pki) @ j) | (Ex #j. Reveal_EphK(peki) @ j)"

end

// vim: ft=spthy