1
0
Fork 0
mirror of https://github.com/postmannen/ctrl.git synced 2025-01-18 21:59:30 +00:00
ctrl/requests_keys.go

516 lines
16 KiB
Go
Raw Normal View History

2022-05-19 20:54:33 +02:00
package steward
import (
"bytes"
"encoding/json"
"fmt"
)
// ---
type methodREQPublicKey struct {
event Event
}
func (m methodREQPublicKey) getKind() Event {
return m.event
}
// Handler to get the public ed25519 key from a node.
func (m methodREQPublicKey) handler(proc process, message Message, node string) ([]byte, error) {
// Get a context with the timeout specified in message.MethodTimeout.
ctx, _ := getContextForMethodTimeout(proc.ctx, message)
proc.processes.wg.Add(1)
go func() {
defer proc.processes.wg.Done()
outCh := make(chan []byte)
go func() {
// Normally we would do some logic here, where the result is passed to outCh when done,
// so we can split up the working logic, and f.ex. sending a reply logic.
// In this case this go func and the below select is not needed, but keeping it so the
// structure is the same as the other handlers.
select {
case <-ctx.Done():
case outCh <- proc.nodeAuth.SignPublicKey:
}
}()
select {
// case proc.toRingbufferCh <- []subjectAndMessage{sam}:
case <-ctx.Done():
case out := <-outCh:
// Prepare and queue for sending a new message with the output
// of the action executed.
newReplyMessage(proc, message, out)
}
}()
// Send back an ACK message.
ackMsg := []byte("confirmed from: " + node + ": " + fmt.Sprint(message.ID))
return ackMsg, nil
}
// ----
2022-05-24 07:21:48 +02:00
type methodREQKeysRequestUpdate struct {
2022-05-19 20:54:33 +02:00
event Event
}
2022-05-24 07:21:48 +02:00
func (m methodREQKeysRequestUpdate) getKind() Event {
2022-05-19 20:54:33 +02:00
return m.event
}
// Handler to get all the public ed25519 keys from a central server.
2022-05-24 07:21:48 +02:00
func (m methodREQKeysRequestUpdate) handler(proc process, message Message, node string) ([]byte, error) {
2022-05-19 20:54:33 +02:00
// Get a context with the timeout specified in message.MethodTimeout.
// TODO:
// - Since this is implemented as a NACK message we could implement a
// metric thats shows the last time a node did a key request.
// - We could also implement a metrics on the receiver showing the last
// time a node had done an update.
ctx, _ := getContextForMethodTimeout(proc.ctx, message)
proc.processes.wg.Add(1)
go func() {
defer proc.processes.wg.Done()
outCh := make(chan []byte)
go func() {
// Normally we would do some logic here, where the result is passed to outCh when done,
// so we can split up the working logic, and f.ex. sending a reply logic.
// In this case this go func and the below select is not needed, but keeping it so the
// structure is the same as the other handlers.
select {
case <-ctx.Done():
case outCh <- []byte{}:
}
}()
select {
case <-ctx.Done():
// case out := <-outCh:
case <-outCh:
// Using a func here to set the scope of the lock, and then be able to
// defer the unlock when leaving that scope.
func() {
proc.centralAuth.pki.nodesAcked.mu.Lock()
defer proc.centralAuth.pki.nodesAcked.mu.Unlock()
2022-10-05 09:16:22 +02:00
er := fmt.Errorf(" <---- methodREQKeysRequestUpdate: received hash from NODE=%v, HASH=%v", message.FromNode, message.Data)
proc.errorKernel.logDebug(er, proc.configuration)
2022-05-19 20:54:33 +02:00
// Check if the received hash is the same as the one currently active,
if bytes.Equal(proc.centralAuth.pki.nodesAcked.keysAndHash.Hash[:], message.Data) {
er := fmt.Errorf("info: methodREQKeysRequestUpdate: node %v and central have equal keys, nothing to do, exiting key update handler", message.FromNode)
// proc.errorKernel.infoSend(proc, message, er)
proc.errorKernel.logDebug(er, proc.configuration)
2022-05-19 20:54:33 +02:00
return
}
er = fmt.Errorf("info: methodREQKeysRequestUpdate: node %v and central had not equal keys, preparing to send new version of keys", message.FromNode)
proc.errorKernel.logDebug(er, proc.configuration)
2022-05-19 20:54:33 +02:00
2022-10-05 09:16:22 +02:00
er = fmt.Errorf("info: methodREQKeysRequestUpdate: marshalling new keys and hash to send: map=%v, hash=%v", proc.centralAuth.pki.nodesAcked.keysAndHash.Keys, proc.centralAuth.pki.nodesAcked.keysAndHash.Hash)
proc.errorKernel.logDebug(er, proc.configuration)
2022-05-19 20:54:33 +02:00
b, err := json.Marshal(proc.centralAuth.pki.nodesAcked.keysAndHash)
if err != nil {
2022-05-24 07:21:48 +02:00
er := fmt.Errorf("error: methodREQKeysRequestUpdate, failed to marshal keys map: %v", err)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-05-19 20:54:33 +02:00
}
2022-10-05 09:16:22 +02:00
er = fmt.Errorf("----> methodREQKeysRequestUpdate: SENDING KEYS TO NODE=%v", message.FromNode)
proc.errorKernel.logDebug(er, proc.configuration)
2022-05-19 20:54:33 +02:00
newReplyMessage(proc, message, b)
}()
}
}()
// NB: We're not sending an ACK message for this request type.
return nil, nil
}
// ----
2022-05-24 07:21:48 +02:00
type methodREQKeysDeliverUpdate struct {
2022-05-19 20:54:33 +02:00
event Event
}
2022-05-24 07:21:48 +02:00
func (m methodREQKeysDeliverUpdate) getKind() Event {
2022-05-19 20:54:33 +02:00
return m.event
}
2022-05-24 07:21:48 +02:00
// Handler to receive the public keys from a central server.
func (m methodREQKeysDeliverUpdate) handler(proc process, message Message, node string) ([]byte, error) {
2022-05-19 20:54:33 +02:00
// Get a context with the timeout specified in message.MethodTimeout.
// TODO:
// - Since this is implemented as a NACK message we could implement a
// metric thats shows the last time keys were updated.
ctx, _ := getContextForMethodTimeout(proc.ctx, message)
proc.processes.wg.Add(1)
go func() {
defer proc.processes.wg.Done()
outCh := make(chan []byte)
go func() {
// Normally we would do some logic here, where the result is passed to outCh when done,
// so we can split up the working logic, and f.ex. sending a reply logic.
// In this case this go func and the below select is not needed, but keeping it so the
// structure is the same as the other handlers.
select {
case <-ctx.Done():
case outCh <- []byte{}:
}
}()
select {
// case proc.toRingbufferCh <- []subjectAndMessage{sam}:
case <-ctx.Done():
case <-outCh:
proc.nodeAuth.publicKeys.mu.Lock()
2022-06-01 07:29:25 +02:00
var keysAndHash keysAndHash
err := json.Unmarshal(message.Data, &keysAndHash)
if err != nil {
er := fmt.Errorf("error: REQKeysDeliverUpdate : json unmarshal failed: %v, message: %v", err, message)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-06-01 07:29:25 +02:00
}
2022-10-05 09:16:22 +02:00
er := fmt.Errorf("<---- REQKeysDeliverUpdate: after unmarshal, nodeAuth keysAndhash contains: %+v", keysAndHash)
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-01 07:29:25 +02:00
// If the received map was empty we also want to delete all the locally stored keys,
// else we copy the marshaled keysAndHash we received from central into our map.
if len(keysAndHash.Keys) < 1 {
proc.nodeAuth.publicKeys.keysAndHash = newKeysAndHash()
} else {
proc.nodeAuth.publicKeys.keysAndHash = &keysAndHash
}
2022-05-19 20:54:33 +02:00
proc.nodeAuth.publicKeys.mu.Unlock()
if err != nil {
2022-05-24 07:21:48 +02:00
er := fmt.Errorf("error: REQKeysDeliverUpdate : json unmarshal failed: %v, message: %v", err, message)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-05-19 20:54:33 +02:00
}
// We need to also persist the hash on the receiving nodes. We can then load
// that key upon startup.
2022-05-19 20:54:33 +02:00
err = proc.nodeAuth.publicKeys.saveToFile()
if err != nil {
2022-05-24 07:21:48 +02:00
er := fmt.Errorf("error: REQKeysDeliverUpdate : save to file failed: %v, message: %v", err, message)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-05-19 20:54:33 +02:00
}
// Prepare and queue for sending a new message with the output
// of the action executed.
// newReplyMessage(proc, message, out)
}
}()
// Send back an ACK message.
// ackMsg := []byte("confirmed from: " + node + ": " + fmt.Sprint(message.ID))
return nil, nil
}
// ----
2022-05-24 07:21:48 +02:00
type methodREQKeysAllow struct {
2022-05-19 20:54:33 +02:00
event Event
}
2022-05-24 07:21:48 +02:00
func (m methodREQKeysAllow) getKind() Event {
2022-05-19 20:54:33 +02:00
return m.event
}
// Handler to allow new public keys into the database on central auth.
// Nodes will send the public key in the REQHello messages. When they
// are recived on the central server they will be put into a temp key
// map, and we need to acknowledge them before they are moved into the
// main key map, and then allowed to be sent out to other nodes.
2022-05-24 07:21:48 +02:00
func (m methodREQKeysAllow) handler(proc process, message Message, node string) ([]byte, error) {
2022-05-19 20:54:33 +02:00
// Get a context with the timeout specified in message.MethodTimeout.
ctx, _ := getContextForMethodTimeout(proc.ctx, message)
proc.processes.wg.Add(1)
go func() {
defer proc.processes.wg.Done()
outCh := make(chan []byte)
go func() {
// Normally we would do some logic here, where the result is passed to outCh when done,
// so we can split up the working logic, and f.ex. sending a reply logic.
// In this case this go func and the below select is not needed, but keeping it so the
// structure is the same as the other handlers.
select {
case <-ctx.Done():
case outCh <- []byte{}:
}
}()
select {
case <-ctx.Done():
case <-outCh:
proc.centralAuth.pki.nodeNotAckedPublicKeys.mu.Lock()
defer proc.centralAuth.pki.nodeNotAckedPublicKeys.mu.Unlock()
// Range over all the MethodArgs, where each element represents a node to allow,
// and move the node from the notAcked map to the allowed map.
for _, n := range message.MethodArgs {
key, ok := proc.centralAuth.pki.nodeNotAckedPublicKeys.KeyMap[Node(n)]
if ok {
func() {
proc.centralAuth.pki.nodesAcked.mu.Lock()
defer proc.centralAuth.pki.nodesAcked.mu.Unlock()
// Store/update the node and public key on the allowed pubKey map.
proc.centralAuth.pki.nodesAcked.keysAndHash.Keys[Node(n)] = key
}()
// Add key to persistent storage.
proc.centralAuth.pki.dbUpdatePublicKey(string(n), key)
// Delete the key from the NotAcked map
delete(proc.centralAuth.pki.nodeNotAckedPublicKeys.KeyMap, Node(n))
2022-05-24 07:21:48 +02:00
er := fmt.Errorf("info: REQKeysAllow : allowed new/updated public key for %v to allowed public key map", n)
2022-05-19 20:54:33 +02:00
proc.errorKernel.infoSend(proc, message, er)
}
}
// All new elements are now added, and we can create a new hash
// representing the current keys in the allowed map.
proc.centralAuth.updateHash(proc, message)
2022-05-19 20:54:33 +02:00
2022-06-02 07:05:47 +02:00
// If new keys were allowed into the main map, we should send out one
// single update to all the registered nodes to inform of an update.
// NB: If a node is not reachable at the time the update is sent it is
// not a problem since the nodes will periodically check for updates.
2022-05-31 11:05:21 +02:00
//
2022-06-02 07:05:47 +02:00
// If there are errors we will return from the function, and send no
// updates.
2022-06-02 09:36:09 +02:00
err := pushKeys(proc, message, []Node{})
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
if err != nil {
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, err, logWarning)
2022-06-02 09:36:09 +02:00
return
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
}
}()
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
ackMsg := []byte("confirmed from: " + node + ": " + fmt.Sprint(message.ID))
return ackMsg, nil
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
// pushKeys will try to push the the current keys and hashes to each node once.
// As input arguments it takes the current process, the current message, and a
// []Node in nodes.
// The nodes are used when a node or nodes have been deleted from the current
// nodesAcked map since it will contain the nodes that were deleted so we are
// also able to send an update to them as well.
func pushKeys(proc process, message Message, nodes []Node) error {
2022-10-05 09:16:22 +02:00
er := fmt.Errorf("info: beginning of pushKeys, nodes=%v", nodes)
2022-06-02 09:36:09 +02:00
var knh []byte
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-02 09:36:09 +02:00
err := func() error {
proc.centralAuth.pki.nodesAcked.mu.Lock()
defer proc.centralAuth.pki.nodesAcked.mu.Unlock()
b, err := json.Marshal(proc.centralAuth.pki.nodesAcked.keysAndHash)
if err != nil {
er := fmt.Errorf("error: methodREQKeysAllow, failed to marshal keys map: %v", err)
return er
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
copy(knh, b)
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
return nil
}()
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
if err != nil {
return err
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
// proc.centralAuth.pki.nodeNotAckedPublicKeys.mu.Lock()
// defer proc.centralAuth.pki.nodeNotAckedPublicKeys.mu.Unlock()
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
// For all nodes that is not ack'ed we try to send an update once.
for n := range proc.centralAuth.pki.nodeNotAckedPublicKeys.KeyMap {
2022-10-05 09:16:22 +02:00
er := fmt.Errorf("info: node to send REQKeysDeliverUpdate to:%v ", n)
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-02 09:36:09 +02:00
msg := Message{
ToNode: n,
Method: REQKeysDeliverUpdate,
ReplyMethod: REQNone,
ACKTimeout: 0,
2022-06-02 09:36:09 +02:00
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
sam, err := newSubjectAndMessage(msg)
if err != nil {
// In theory the system should drop the message before it reaches here.
er := fmt.Errorf("error: newSubjectAndMessage : %v, message: %v", err, message)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-06-02 09:36:09 +02:00
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
proc.toRingbufferCh <- []subjectAndMessage{sam}
2022-10-05 09:16:22 +02:00
er = fmt.Errorf("----> methodREQKeysAllow: SENDING KEYS TO NODE=%v", message.FromNode)
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-02 09:36:09 +02:00
}
// Create the data payload of the current allowed keys.
b, err := json.Marshal(proc.centralAuth.pki.nodesAcked.keysAndHash)
if err != nil {
er := fmt.Errorf("error: methodREQKeysAllow, failed to marshal keys map: %v", err)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-06-02 09:36:09 +02:00
}
proc.centralAuth.pki.nodesAcked.mu.Lock()
defer proc.centralAuth.pki.nodesAcked.mu.Unlock()
// Concatenate the current nodes in the keysAndHash map and the nodes
// we got from the function argument when this function was called.
nodeMap := make(map[Node]struct{})
for n := range proc.centralAuth.pki.nodesAcked.keysAndHash.Keys {
nodeMap[n] = struct{}{}
}
for _, n := range nodes {
nodeMap[n] = struct{}{}
}
// For all nodes that is ack'ed we try to send an update once.
for n := range nodeMap {
2022-10-05 09:16:22 +02:00
er := fmt.Errorf("info: node to send REQKeysDeliverUpdate to:%v ", n)
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-02 09:36:09 +02:00
msg := Message{
ToNode: n,
Method: REQKeysDeliverUpdate,
Data: b,
ReplyMethod: REQNone,
ACKTimeout: 0,
2022-06-02 09:36:09 +02:00
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
sam, err := newSubjectAndMessage(msg)
if err != nil {
// In theory the system should drop the message before it reaches here.
er := fmt.Errorf("error: newSubjectAndMessage : %v, message: %v", err, message)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-06-02 09:36:09 +02:00
}
2022-06-02 07:05:47 +02:00
2022-06-02 09:36:09 +02:00
proc.toRingbufferCh <- []subjectAndMessage{sam}
2022-06-02 07:05:47 +02:00
2022-10-05 09:16:22 +02:00
er = fmt.Errorf("----> methodREQKeysAllow: sending keys update to node=%v", message.FromNode)
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-02 09:36:09 +02:00
}
2022-06-02 09:36:09 +02:00
return nil
2022-05-19 20:54:33 +02:00
}
2022-06-01 07:29:25 +02:00
type methodREQKeysDelete struct {
event Event
}
func (m methodREQKeysDelete) getKind() Event {
return m.event
}
func (m methodREQKeysDelete) handler(proc process, message Message, node string) ([]byte, error) {
inf := fmt.Errorf("<--- methodREQKeysDelete received from: %v, containing: %v", message.FromNode, message.MethodArgs)
proc.errorKernel.logDebug(inf, proc.configuration)
2022-06-01 07:29:25 +02:00
proc.processes.wg.Add(1)
go func() {
defer proc.processes.wg.Done()
// Get a context with the timeout specified in message.MethodTimeout.
ctx, cancel := getContextForMethodTimeout(proc.ctx, message)
outCh := make(chan []byte)
errCh := make(chan error)
proc.processes.wg.Add(1)
go func() {
defer proc.processes.wg.Done()
switch {
case len(message.MethodArgs) < 1:
errCh <- fmt.Errorf("error: methodREQAclGroupNodesDeleteNode: got <1 number methodArgs, want >0")
return
}
// HERE:
// We want to be able to define more nodes keys to delete.
// Loop over the methodArgs, and call the keyDelete function for each node,
// or rewrite the deleteKey to deleteKeys and it takes a []node as input
// so all keys can be deleted in 1 go, and we create 1 new hash, instead
// of doing it for each node delete.
proc.centralAuth.deletePublicKeys(proc, message, message.MethodArgs)
2022-10-05 09:16:22 +02:00
er := fmt.Errorf("info: Deleted public keys: %v", message.MethodArgs)
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-01 07:29:25 +02:00
// All new elements are now added, and we can create a new hash
// representing the current keys in the allowed map.
proc.centralAuth.updateHash(proc, message)
2022-10-05 09:16:22 +02:00
er = fmt.Errorf(" * DEBUG updated hash for public keys")
proc.errorKernel.logDebug(er, proc.configuration)
2022-06-01 07:29:25 +02:00
2022-06-02 09:36:09 +02:00
var nodes []Node
for _, n := range message.MethodArgs {
nodes = append(nodes, Node(n))
}
err := pushKeys(proc, message, nodes)
if err != nil {
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, err, logWarning)
2022-06-02 09:36:09 +02:00
return
}
2022-06-01 07:29:25 +02:00
outString := fmt.Sprintf("deleted public keys for the nodes=%v\n", message.MethodArgs)
out := []byte(outString)
select {
case outCh <- out:
case <-ctx.Done():
return
}
}()
select {
case err := <-errCh:
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, err, logWarning)
2022-06-01 07:29:25 +02:00
case <-ctx.Done():
cancel()
er := fmt.Errorf("error: methodREQAclGroupNodesDeleteNode: method timed out: %v", message.MethodArgs)
2023-01-11 08:38:15 +01:00
proc.errorKernel.errSend(proc, message, er, logWarning)
2022-06-01 07:29:25 +02:00
case out := <-outCh:
2022-06-02 09:36:09 +02:00
2022-06-01 07:29:25 +02:00
newReplyMessage(proc, message, out)
}
}()
ackMsg := []byte("confirmed from: " + node + ": " + fmt.Sprint(message.ID))
return ackMsg, nil
}