Factor NodePool into its own package
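In effect, the gRPC-backed NodePool moves out of package agent and into api/agent/nodepool/grpc. A minimal sketch of the caller-side change, using only the constructor and import names that appear in the diffs below (the package name and surrounding wiring are assumed):

package example

import (
    "github.com/fnproject/fn/api/agent"
    agent_grpc "github.com/fnproject/fn/api/agent/nodepool/grpc"
)

// newPool shows the relocation: what used to be agent.DefaultgRPCNodePool is
// now agent_grpc.DefaultgRPCNodePool, and the returned value still satisfies
// agent.NodePool.
func newPool(npmAddress, cert, key, ca string) agent.NodePool {
    return agent_grpc.DefaultgRPCNodePool(npmAddress, cert, key, ca)
}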
@@ -2,24 +2,8 @@ package agent

import (
    "context"
    "encoding/json"
    "io"
    "sync"
    "sync/atomic"
    "time"

    "google.golang.org/grpc"

    pb "github.com/fnproject/fn/api/agent/grpc"
    "github.com/fnproject/fn/api/id"
    "github.com/fnproject/fn/grpcutil"
    "github.com/fnproject/fn/poolmanager"
    "github.com/sirupsen/logrus"
)

const (
    // CapacityUpdatePeriod defines how often the capacity updates are sent
    CapacityUpdatePeriod = 1 * time.Second
)

// NodePool is the interface to interact with Node pool manager
@@ -39,42 +23,6 @@ type Runner interface {
// RunnerFactory is a factory func that creates a Runner usable by the pool.
type RunnerFactory func(addr string, lbgId string, cert string, key string, ca string) (Runner, error)

type gRPCNodePool struct {
    npm        poolmanager.NodePoolManager
    advertiser poolmanager.CapacityAdvertiser
    mx         sync.RWMutex
    lbg        map[string]*lbg // {lbgid -> *lbg}
    generator  RunnerFactory
    //TODO find a better place for this
    pki pkiData

    shutdown chan struct{}
}

// TODO need to go in a better place
type pkiData struct {
    ca   string
    key  string
    cert string
}

type lbg struct {
    mx      sync.RWMutex
    id      string
    runners map[string]Runner
    r_list  atomic.Value // We attempt to maintain the same order of runners as advertised by the NPM.
    // This is to preserve as reasonable behaviour as possible for the CH algorithm
    generator RunnerFactory
}

type gRPCRunner struct {
    // Need a WaitGroup of TryExec in flight
    wg      sync.WaitGroup
    address string
    conn    *grpc.ClientConn
    client  pb.RunnerProtocolClient
}

type nullRunner struct{}

func (n *nullRunner) TryExec(ctx context.Context, call Call) (bool, error) {
@@ -83,331 +31,4 @@ func (n *nullRunner) TryExec(ctx context.Context, call Call) (bool, error) {

func (n *nullRunner) Close() {}

func GRPCRunnerFactory(addr string, lbgID string, cert string, key string, ca string) (Runner, error) {
    p := pkiData{
        cert: cert,
        key:  key,
        ca:   ca,
    }
    conn, client := runnerConnection(addr, lbgID, p)
    return &gRPCRunner{
        address: addr,
        conn:    conn,
        client:  client,
    }, nil
}

func DefaultgRPCNodePool(npmAddress string, cert string, key string, ca string) NodePool {
    npm := poolmanager.NewNodePoolManager(npmAddress, cert, key, ca)
    // TODO do we need to persist this ID in order to survive restart?
    lbID := id.New().String()
    advertiser := poolmanager.NewCapacityAdvertiser(npm, lbID, CapacityUpdatePeriod)
    rf := GRPCRunnerFactory

    return NewgRPCNodePool(cert, key, ca, npm, advertiser, rf)
}

func NewgRPCNodePool(cert string, key string, ca string,
    npm poolmanager.NodePoolManager,
    advertiser poolmanager.CapacityAdvertiser,
    rf RunnerFactory) NodePool {
    p := pkiData{
        ca:   ca,
        cert: cert,
        key:  key,
    }

    np := &gRPCNodePool{
        npm:        npm,
        advertiser: advertiser,
        lbg:        make(map[string]*lbg),
        generator:  rf,
        shutdown:   make(chan struct{}),
        pki:        p,
    }
    go np.maintenance()
    return np
}

func (np *gRPCNodePool) Runners(lbgID string) []Runner {
    np.mx.RLock()
    lbg, ok := np.lbg[lbgID]
    np.mx.RUnlock()

    if !ok {
        np.mx.Lock()
        lbg, ok = np.lbg[lbgID]
        if !ok {
            lbg = newLBG(lbgID, np.generator)
            np.lbg[lbgID] = lbg
        }
        np.mx.Unlock()
    }

    return lbg.runnerList()
}

func (np *gRPCNodePool) Shutdown() {
    np.advertiser.Shutdown()
    np.npm.Shutdown()
}

func (np *gRPCNodePool) AssignCapacity(r *poolmanager.CapacityRequest) {
    np.advertiser.AssignCapacity(r)
}

func (np *gRPCNodePool) ReleaseCapacity(r *poolmanager.CapacityRequest) {
    np.advertiser.ReleaseCapacity(r)
}

func (np *gRPCNodePool) maintenance() {
    ticker := time.NewTicker(500 * time.Millisecond)
    for {
        select {
        case <-np.shutdown:
            return
        case <-ticker.C:
            // Reload any LBGroup information from NPM (pull for the moment, shift to listening to a stream later)
            np.reloadLBGmembership()
        }
    }
}
func newLBG(lbgID string, generator RunnerFactory) *lbg {
    lbg := &lbg{
        id:        lbgID,
        runners:   make(map[string]Runner),
        r_list:    atomic.Value{},
        generator: generator,
    }
    lbg.r_list.Store([]Runner{})
    return lbg
}

func (np *gRPCNodePool) reloadLBGmembership() {
    np.mx.RLock()
    lbgroups := np.lbg
    np.mx.RUnlock()
    for lbgID, lbg := range lbgroups {
        lbg.reloadMembers(lbgID, np.npm, np.pki)
    }
}

func (lbg *lbg) runnerList() []Runner {
    orig_runners := lbg.r_list.Load().([]Runner)
    // XXX: Return a copy. If we required this to be immutably read by the caller, we could return the structure directly
    runners := make([]Runner, len(orig_runners))
    for i, r := range orig_runners {
        runners[i] = r
    }
    return runners
}

func (lbg *lbg) reloadMembers(lbgID string, npm poolmanager.NodePoolManager, p pkiData) {
    runners, err := npm.GetRunners(lbgID)
    if err != nil {
        logrus.Debug("Failed to get the list of runners from node pool manager")
    }
    lbg.mx.Lock()
    defer lbg.mx.Unlock()
    r_list := make([]Runner, len(runners))
    seen := map[string]bool{} // If we've seen a particular runner or not
    var errGenerator error
    for i, addr := range runners {
        r, ok := lbg.runners[addr]
        if !ok {
            logrus.WithField("runner_addr", addr).Debug("New Runner to be added")
            r, errGenerator = lbg.generator(addr, lbgID, p.cert, p.key, p.ca)
            if errGenerator != nil {
                logrus.WithField("runner_addr", addr).Debug("Creation of the new runner failed")
            } else {
                lbg.runners[addr] = r
            }
        }
        if errGenerator == nil {
            r_list[i] = r // Maintain the delivered order
        } else {
            // some algorithms (like consistent hash) work better if the i'th element
            // of r_list points to the same node on all LBs, so insert a placeholder
            // if we can't create the runner for some reason
            r_list[i] = &nullRunner{}
        }

        seen[addr] = true
    }
    lbg.r_list.Store(r_list)

    // Remove any runners that we have not encountered
    for addr, r := range lbg.runners {
        if _, ok := seen[addr]; !ok {
            logrus.WithField("runner_addr", addr).Debug("Removing drained runner")
            delete(lbg.runners, addr)
            r.Close()
        }
    }
}

func (r *gRPCRunner) Close() {
    go func() {
        r.wg.Wait()
        r.conn.Close()
    }()
}

func runnerConnection(address, lbGroupID string, pki pkiData) (*grpc.ClientConn, pb.RunnerProtocolClient) {
    ctx := context.Background()

    creds, err := grpcutil.CreateCredentials(pki.cert, pki.key, pki.ca)
    if err != nil {
        logrus.WithError(err).Error("Unable to create credentials to connect to runner node")
    }
    conn, err := grpcutil.DialWithBackoff(ctx, address, creds, grpc.DefaultBackoffConfig)
    if err != nil {
        logrus.WithError(err).Error("Unable to connect to runner node")
    }

    protocolClient := pb.NewRunnerProtocolClient(conn)
    logrus.WithField("lbg_id", lbGroupID).WithField("runner_addr", address).Info("Connected to runner")

    return conn, protocolClient
}
func (r *gRPCRunner) TryExec(ctx context.Context, call Call) (bool, error) {
    logrus.WithField("runner_addr", r.address).Debug("Attempting to place call")
    r.wg.Add(1)
    defer r.wg.Done()

    // Get app and route information
    // Construct model.Call with CONFIG in it already
    modelJSON, err := json.Marshal(call.Model())
    if err != nil {
        logrus.WithError(err).Error("Failed to encode model as JSON")
        // If we can't encode the model, no runner will ever be able to run this. Give up.
        return true, err
    }
    runnerConnection, err := r.client.Engage(context.Background())
    if err != nil {
        logrus.WithError(err).Error("Unable to create client to runner node")
        // Try on next runner
        return false, err
    }

    err = runnerConnection.Send(&pb.ClientMsg{Body: &pb.ClientMsg_Try{Try: &pb.TryCall{ModelsCallJson: string(modelJSON)}}})
    if err != nil {
        logrus.WithError(err).Error("Failed to send message to runner node")
        return false, err
    }
    msg, err := runnerConnection.Recv()
    if err != nil {
        logrus.WithError(err).Error("Failed to receive first message from runner node")
        return false, err
    }

    switch body := msg.Body.(type) {
    case *pb.RunnerMsg_Acknowledged:
        if !body.Acknowledged.Committed {
            logrus.Errorf("Runner didn't commit invocation request: %v", body.Acknowledged.Details)
            // Try the next runner
            return false, nil
        }
        logrus.Info("Runner committed invocation request, sending data frames")
        done := make(chan error)
        go receiveFromRunner(runnerConnection, call, done)
        sendToRunner(call, runnerConnection)
        return true, <-done

    default:
        logrus.Infof("Unhandled message type received from runner: %v", msg)
        return true, nil
    }
}

func sendToRunner(call Call, protocolClient pb.RunnerProtocol_EngageClient) error {
    bodyReader, err := RequestReader(&call)
    if err != nil {
        logrus.WithError(err).Error("Unable to get reader for request body")
        return err
    }
    writeBufferSize := 10 * 1024 // 10KB
    writeBuffer := make([]byte, writeBufferSize)
    for {
        n, err := bodyReader.Read(writeBuffer)
        logrus.Debugf("Wrote %v bytes to the runner", n)

        if err == io.EOF {
            err = protocolClient.Send(&pb.ClientMsg{
                Body: &pb.ClientMsg_Data{
                    Data: &pb.DataFrame{
                        // Send only the bytes actually read on this iteration
                        Data: writeBuffer[:n],
                        Eof:  true,
                    },
                },
            })
            if err != nil {
                logrus.WithError(err).Error("Failed to send data frame with EOF to runner")
            }
            break
        }
        err = protocolClient.Send(&pb.ClientMsg{
            Body: &pb.ClientMsg_Data{
                Data: &pb.DataFrame{
                    Data: writeBuffer[:n],
                    Eof:  false,
                },
            },
        })
        if err != nil {
            logrus.WithError(err).Error("Failed to send data frame")
            return err
        }
    }
    return nil
}

func receiveFromRunner(protocolClient pb.RunnerProtocol_EngageClient, call Call, done chan error) {
    w, err := ResponseWriter(&call)
    if err != nil {
        logrus.WithError(err).Error("Unable to get response writer from call")
        done <- err
        return
    }

    for {
        msg, err := protocolClient.Recv()
        if err != nil {
            logrus.WithError(err).Error("Failed to receive message from runner")
            done <- err
            return
        }

        switch body := msg.Body.(type) {
        case *pb.RunnerMsg_ResultStart:
            switch meta := body.ResultStart.Meta.(type) {
            case *pb.CallResultStart_Http:
                for _, header := range meta.Http.Headers {
                    (*w).Header().Set(header.Key, header.Value)
                }
            default:
                logrus.Errorf("Unhandled meta type in start message: %v", meta)
            }
        case *pb.RunnerMsg_Data:
            (*w).Write(body.Data.Data)
        case *pb.RunnerMsg_Finished:
            if body.Finished.Success {
                logrus.Infof("Call finished successfully: %v", body.Finished.Details)
            } else {
                logrus.Infof("Call finished unsuccessfully: %v", body.Finished.Details)
            }
            close(done)
            return
        default:
            logrus.Errorf("Unhandled message type from runner: %v", body)
        }
    }
}

var NullRunner Runner = &nullRunner{}

389  api/agent/nodepool/grpc/grpc_pool.go  (new file)
@@ -0,0 +1,389 @@
package grpc

import (
    "context"
    "encoding/json"
    "io"
    "sync"
    "sync/atomic"
    "time"

    "google.golang.org/grpc"

    "github.com/fnproject/fn/api/agent"
    pb "github.com/fnproject/fn/api/agent/grpc"
    "github.com/fnproject/fn/api/id"
    "github.com/fnproject/fn/grpcutil"
    "github.com/fnproject/fn/poolmanager"
    "github.com/sirupsen/logrus"
)

const (
    // CapacityUpdatePeriod defines how often the capacity updates are sent
    CapacityUpdatePeriod = 1 * time.Second
)

type gRPCNodePool struct {
    npm        poolmanager.NodePoolManager
    advertiser poolmanager.CapacityAdvertiser
    mx         sync.RWMutex
    lbg        map[string]*lbg // {lbgid -> *lbg}
    generator  agent.RunnerFactory
    //TODO find a better place for this
    pki pkiData

    shutdown chan struct{}
}

// TODO need to go in a better place
type pkiData struct {
    ca   string
    key  string
    cert string
}

type lbg struct {
    mx      sync.RWMutex
    id      string
    runners map[string]agent.Runner
    r_list  atomic.Value // We attempt to maintain the same order of runners as advertised by the NPM.
    // This is to preserve as reasonable behaviour as possible for the CH algorithm
    generator agent.RunnerFactory
}

type gRPCRunner struct {
    // Need a WaitGroup of TryExec in flight
    wg      sync.WaitGroup
    address string
    conn    *grpc.ClientConn
    client  pb.RunnerProtocolClient
}
func GRPCRunnerFactory(addr string, lbgID string, cert string, key string, ca string) (agent.Runner, error) {
    p := pkiData{
        cert: cert,
        key:  key,
        ca:   ca,
    }
    conn, client := runnerConnection(addr, lbgID, p)
    return &gRPCRunner{
        address: addr,
        conn:    conn,
        client:  client,
    }, nil
}

func DefaultgRPCNodePool(npmAddress string, cert string, key string, ca string) agent.NodePool {
    npm := poolmanager.NewNodePoolManager(npmAddress, cert, key, ca)
    // TODO do we need to persist this ID in order to survive restart?
    lbID := id.New().String()
    advertiser := poolmanager.NewCapacityAdvertiser(npm, lbID, CapacityUpdatePeriod)
    rf := GRPCRunnerFactory

    return NewgRPCNodePool(cert, key, ca, npm, advertiser, rf)
}

func NewgRPCNodePool(cert string, key string, ca string,
    npm poolmanager.NodePoolManager,
    advertiser poolmanager.CapacityAdvertiser,
    rf agent.RunnerFactory) agent.NodePool {
    p := pkiData{
        ca:   ca,
        cert: cert,
        key:  key,
    }

    np := &gRPCNodePool{
        npm:        npm,
        advertiser: advertiser,
        lbg:        make(map[string]*lbg),
        generator:  rf,
        shutdown:   make(chan struct{}),
        pki:        p,
    }
    go np.maintenance()
    return np
}
func (np *gRPCNodePool) Runners(lbgID string) []agent.Runner {
    np.mx.RLock()
    lbg, ok := np.lbg[lbgID]
    np.mx.RUnlock()

    if !ok {
        np.mx.Lock()
        lbg, ok = np.lbg[lbgID]
        if !ok {
            lbg = newLBG(lbgID, np.generator)
            np.lbg[lbgID] = lbg
        }
        np.mx.Unlock()
    }

    return lbg.runnerList()
}

func (np *gRPCNodePool) Shutdown() {
    np.advertiser.Shutdown()
    np.npm.Shutdown()
}

func (np *gRPCNodePool) AssignCapacity(r *poolmanager.CapacityRequest) {
    np.advertiser.AssignCapacity(r)
}

func (np *gRPCNodePool) ReleaseCapacity(r *poolmanager.CapacityRequest) {
    np.advertiser.ReleaseCapacity(r)
}

func (np *gRPCNodePool) maintenance() {
    ticker := time.NewTicker(500 * time.Millisecond)
    for {
        select {
        case <-np.shutdown:
            return
        case <-ticker.C:
            // Reload any LBGroup information from NPM (pull for the moment, shift to listening to a stream later)
            np.reloadLBGmembership()
        }
    }
}
func newLBG(lbgID string, generator agent.RunnerFactory) *lbg {
    lbg := &lbg{
        id:        lbgID,
        runners:   make(map[string]agent.Runner),
        r_list:    atomic.Value{},
        generator: generator,
    }
    lbg.r_list.Store([]agent.Runner{})
    return lbg
}

func (np *gRPCNodePool) reloadLBGmembership() {
    np.mx.RLock()
    lbgroups := np.lbg
    np.mx.RUnlock()
    for lbgID, lbg := range lbgroups {
        lbg.reloadMembers(lbgID, np.npm, np.pki)
    }
}

func (lbg *lbg) runnerList() []agent.Runner {
    orig_runners := lbg.r_list.Load().([]agent.Runner)
    // XXX: Return a copy. If we required this to be immutably read by the caller, we could return the structure directly
    runners := make([]agent.Runner, len(orig_runners))
    for i, r := range orig_runners {
        runners[i] = r
    }
    return runners
}

func (lbg *lbg) reloadMembers(lbgID string, npm poolmanager.NodePoolManager, p pkiData) {
    runners, err := npm.GetRunners(lbgID)
    if err != nil {
        logrus.Debug("Failed to get the list of runners from node pool manager")
    }
    lbg.mx.Lock()
    defer lbg.mx.Unlock()
    r_list := make([]agent.Runner, len(runners))
    seen := map[string]bool{} // If we've seen a particular runner or not
    var errGenerator error
    for i, addr := range runners {
        r, ok := lbg.runners[addr]
        if !ok {
            logrus.WithField("runner_addr", addr).Debug("New Runner to be added")
            r, errGenerator = lbg.generator(addr, lbgID, p.cert, p.key, p.ca)
            if errGenerator != nil {
                logrus.WithField("runner_addr", addr).Debug("Creation of the new runner failed")
            } else {
                lbg.runners[addr] = r
            }
        }
        if errGenerator == nil {
            r_list[i] = r // Maintain the delivered order
        } else {
            // some algorithms (like consistent hash) work better if the i'th element
            // of r_list points to the same node on all LBs, so insert a placeholder
            // if we can't create the runner for some reason
            r_list[i] = agent.NullRunner
        }

        seen[addr] = true
    }
    lbg.r_list.Store(r_list)

    // Remove any runners that we have not encountered
    for addr, r := range lbg.runners {
        if _, ok := seen[addr]; !ok {
            logrus.WithField("runner_addr", addr).Debug("Removing drained runner")
            delete(lbg.runners, addr)
            r.Close()
        }
    }
}
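The placeholder branch in reloadMembers above exists so that the i'th slot means the same runner on every LB, even when one LB fails to build a client for that runner. A toy, invented illustration of why a modulo/consistent-hash style placer cares about slot stability (only the ordering guarantee comes from the code above):

package example

import "hash/fnv"

// pick maps a call key to a slot index; slots is assumed to be > 0.
// If one LB silently dropped a runner it could not construct, its slice would
// be shorter and the same key would land on a different runner than on its
// peers; keeping an agent.NullRunner placeholder at the failed index preserves
// the index-to-runner mapping.
func pick(key string, slots int) int {
    h := fnv.New32a()
    h.Write([]byte(key))
    return int(h.Sum32() % uint32(slots))
}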
func (r *gRPCRunner) Close() {
    go func() {
        r.wg.Wait()
        r.conn.Close()
    }()
}

func runnerConnection(address, lbGroupID string, pki pkiData) (*grpc.ClientConn, pb.RunnerProtocolClient) {
    ctx := context.Background()

    creds, err := grpcutil.CreateCredentials(pki.cert, pki.key, pki.ca)
    if err != nil {
        logrus.WithError(err).Error("Unable to create credentials to connect to runner node")
    }
    conn, err := grpcutil.DialWithBackoff(ctx, address, creds, grpc.DefaultBackoffConfig)
    if err != nil {
        logrus.WithError(err).Error("Unable to connect to runner node")
    }

    protocolClient := pb.NewRunnerProtocolClient(conn)
    logrus.WithField("lbg_id", lbGroupID).WithField("runner_addr", address).Info("Connected to runner")

    return conn, protocolClient
}

func (r *gRPCRunner) TryExec(ctx context.Context, call agent.Call) (bool, error) {
    logrus.WithField("runner_addr", r.address).Debug("Attempting to place call")
    r.wg.Add(1)
    defer r.wg.Done()

    // Get app and route information
    // Construct model.Call with CONFIG in it already
    modelJSON, err := json.Marshal(call.Model())
    if err != nil {
        logrus.WithError(err).Error("Failed to encode model as JSON")
        // If we can't encode the model, no runner will ever be able to run this. Give up.
        return true, err
    }
    runnerConnection, err := r.client.Engage(context.Background())
    if err != nil {
        logrus.WithError(err).Error("Unable to create client to runner node")
        // Try on next runner
        return false, err
    }

    err = runnerConnection.Send(&pb.ClientMsg{Body: &pb.ClientMsg_Try{Try: &pb.TryCall{ModelsCallJson: string(modelJSON)}}})
    if err != nil {
        logrus.WithError(err).Error("Failed to send message to runner node")
        return false, err
    }
    msg, err := runnerConnection.Recv()
    if err != nil {
        logrus.WithError(err).Error("Failed to receive first message from runner node")
        return false, err
    }

    switch body := msg.Body.(type) {
    case *pb.RunnerMsg_Acknowledged:
        if !body.Acknowledged.Committed {
            logrus.Errorf("Runner didn't commit invocation request: %v", body.Acknowledged.Details)
            // Try the next runner
            return false, nil
        }
        logrus.Info("Runner committed invocation request, sending data frames")
        done := make(chan error)
        go receiveFromRunner(runnerConnection, call, done)
        sendToRunner(call, runnerConnection)
        return true, <-done

    default:
        logrus.Infof("Unhandled message type received from runner: %v", msg)
        return true, nil
    }
}

func sendToRunner(call agent.Call, protocolClient pb.RunnerProtocol_EngageClient) error {
    bodyReader, err := agent.RequestReader(&call)
    if err != nil {
        logrus.WithError(err).Error("Unable to get reader for request body")
        return err
    }
    writeBufferSize := 10 * 1024 // 10KB
    writeBuffer := make([]byte, writeBufferSize)
    for {
        n, err := bodyReader.Read(writeBuffer)
        logrus.Debugf("Wrote %v bytes to the runner", n)

        if err == io.EOF {
            err = protocolClient.Send(&pb.ClientMsg{
                Body: &pb.ClientMsg_Data{
                    Data: &pb.DataFrame{
                        // Send only the bytes actually read on this iteration
                        Data: writeBuffer[:n],
                        Eof:  true,
                    },
                },
            })
            if err != nil {
                logrus.WithError(err).Error("Failed to send data frame with EOF to runner")
            }
            break
        }
        err = protocolClient.Send(&pb.ClientMsg{
            Body: &pb.ClientMsg_Data{
                Data: &pb.DataFrame{
                    Data: writeBuffer[:n],
                    Eof:  false,
                },
            },
        })
        if err != nil {
            logrus.WithError(err).Error("Failed to send data frame")
            return err
        }
    }
    return nil
}

func receiveFromRunner(protocolClient pb.RunnerProtocol_EngageClient, call agent.Call, done chan error) {
    w, err := agent.ResponseWriter(&call)
    if err != nil {
        logrus.WithError(err).Error("Unable to get response writer from call")
        done <- err
        return
    }

    for {
        msg, err := protocolClient.Recv()
        if err != nil {
            logrus.WithError(err).Error("Failed to receive message from runner")
            done <- err
            return
        }

        switch body := msg.Body.(type) {
        case *pb.RunnerMsg_ResultStart:
            switch meta := body.ResultStart.Meta.(type) {
            case *pb.CallResultStart_Http:
                for _, header := range meta.Http.Headers {
                    (*w).Header().Set(header.Key, header.Value)
                }
            default:
                logrus.Errorf("Unhandled meta type in start message: %v", meta)
            }
        case *pb.RunnerMsg_Data:
            (*w).Write(body.Data.Data)
        case *pb.RunnerMsg_Finished:
            if body.Finished.Success {
                logrus.Infof("Call finished successfully: %v", body.Finished.Details)
            } else {
                logrus.Infof("Call finished unsuccessfully: %v", body.Finished.Details)
            }
            close(done)
            return
        default:
            logrus.Errorf("Unhandled message type from runner: %v", body)
        }
    }
}
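For orientation, a minimal hypothetical sketch of how a load balancer might consume this pool. placeCall and lbGroupID are invented; it assumes agent.NodePool exposes the Runners method implemented above, and Runner.TryExec's convention (true = the call was handled or definitively failed, false = try the next runner) is taken from the comments in TryExec:

package example

import (
    "context"
    "errors"

    "github.com/fnproject/fn/api/agent"
)

// placeCall walks the runners advertised for an LB group in order and stops at
// the first one that takes the call.
func placeCall(ctx context.Context, pool agent.NodePool, lbGroupID string, call agent.Call) error {
    for _, r := range pool.Runners(lbGroupID) {
        placed, err := r.TryExec(ctx, call)
        if placed {
            return err
        }
    }
    return errors.New("no runner accepted the call")
}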
@@ -1,4 +1,4 @@
-package agent
+package grpc

import (
    "context"
@@ -8,6 +8,7 @@ import (
    "testing"
    "time"

+   "github.com/fnproject/fn/api/agent"
    "github.com/fnproject/fn/api/models"
    "github.com/fnproject/fn/poolmanager"
    model "github.com/fnproject/fn/poolmanager/grpc"
@@ -29,11 +30,11 @@ type mockNodePoolManager struct {
type mockgRPCNodePool struct {
    npm poolmanager.NodePoolManager
    lbg map[string]*lbg
-   generator RunnerFactory
+   generator agent.RunnerFactory
    pki pkiData
}

-func newMockgRPCNodePool(rf RunnerFactory, runners []string) *mockgRPCNodePool {
+func newMockgRPCNodePool(rf agent.RunnerFactory, runners []string) *mockgRPCNodePool {
    npm := &mockNodePoolManager{runners: runners}

    return &mockgRPCNodePool{
@@ -56,8 +57,8 @@ func (npm *mockNodePoolManager) Shutdown() error {
    return nil
}

-func NewMockRunnerFactory(sleep time.Duration, maxCalls int32) RunnerFactory {
-   return func(addr string, lbgID string, cert string, key string, ca string) (Runner, error) {
+func NewMockRunnerFactory(sleep time.Duration, maxCalls int32) agent.RunnerFactory {
+   return func(addr string, lbgID string, cert string, key string, ca string) (agent.Runner, error) {
        return &mockRunner{
            sleep:    sleep,
            maxCalls: maxCalls,
@@ -66,8 +67,8 @@ func NewMockRunnerFactory(sleep time.Duration, maxCalls int32) RunnerFactory {
    }
}

-func FaultyRunnerFactory() RunnerFactory {
-   return func(addr string, lbgID string, cert string, key string, ca string) (Runner, error) {
+func FaultyRunnerFactory() agent.RunnerFactory {
+   return func(addr string, lbgID string, cert string, key string, ca string) (agent.Runner, error) {
        return &mockRunner{
            addr: addr,
        }, errors.New("Creation of new runner failed")
@@ -90,7 +91,7 @@ func (r *mockRunner) decrCalls() {
    r.curCalls--
}

-func (r *mockRunner) TryExec(ctx context.Context, call Call) (bool, error) {
+func (r *mockRunner) TryExec(ctx context.Context, call agent.Call) (bool, error) {
    err := r.checkAndIncrCalls()
    if err != nil {
        return false, err
@@ -102,7 +103,7 @@ func (r *mockRunner) TryExec(ctx context.Context, call Call) (bool, error) {

    time.Sleep(r.sleep)

-   w, err := ResponseWriter(&call)
+   w, err := agent.ResponseWriter(&call)
    if err != nil {
        return true, err
    }
@@ -129,7 +130,7 @@ func setupMockNodePool(lbgID string, expectedRunners []string) (*mockgRPCNodePoo
    return np, lb
}

-func checkRunners(t *testing.T, expectedRunners []string, actualRunners map[string]Runner, ordList []Runner) {
+func checkRunners(t *testing.T, expectedRunners []string, actualRunners map[string]agent.Runner, ordList []agent.Runner) {
    if len(expectedRunners) != len(actualRunners) {
        t.Errorf("List of runners is wrong, expected: %d got: %d", len(expectedRunners), len(actualRunners))
    }
@@ -152,7 +153,7 @@ func TestReloadMembersNoRunners(t *testing.T) {

    np.lbg[lbgID].reloadMembers(lbgID, np.npm, np.pki)
    expectedRunners := []string{}
-   ordList := lb.r_list.Load().([]Runner)
+   ordList := lb.r_list.Load().([]agent.Runner)
    checkRunners(t, expectedRunners, lb.runners, ordList)
}

@@ -162,7 +163,7 @@ func TestReloadMembersNewRunners(t *testing.T) {
    np, lb := setupMockNodePool(lbgID, expectedRunners)

    np.lbg[lbgID].reloadMembers(lbgID, np.npm, np.pki)
-   ordList := lb.r_list.Load().([]Runner)
+   ordList := lb.r_list.Load().([]agent.Runner)
    checkRunners(t, expectedRunners, lb.runners, ordList)
}

@@ -186,7 +187,7 @@ func TestReloadMembersRemoveRunners(t *testing.T) {
    }

    np.lbg[lbgID].reloadMembers(lbgID, np.npm, np.pki)
-   ordList := lb.r_list.Load().([]Runner)
+   ordList := lb.r_list.Load().([]agent.Runner)
    checkRunners(t, expectedRunners, lb.runners, ordList)
}

@@ -201,9 +202,8 @@ func TestReloadMembersFailToCreateNewRunners(t *testing.T) {
    if len(actualRunners) != 0 {
        t.Errorf("List of runners should be empty")
    }
-   ordList := lb.r_list.Load().([]Runner)
-   _, ok := ordList[0].(*nullRunner)
-   if !ok {
+   ordList := lb.r_list.Load().([]agent.Runner)
+   if ordList[0] != agent.NullRunner {
        t.Errorf("Ordered list should have a nullRunner")
    }
}
@@ -17,6 +17,7 @@ import (

    "github.com/fnproject/fn/api/agent"
    "github.com/fnproject/fn/api/agent/hybrid"
+   agent_grpc "github.com/fnproject/fn/api/agent/nodepool/grpc"
    "github.com/fnproject/fn/api/common"
    "github.com/fnproject/fn/api/datastore"
    "github.com/fnproject/fn/api/id"
@@ -395,7 +396,7 @@ func WithAgentFromEnv() ServerOption {
        return err
    }
    delegatedAgent := agent.New(agent.NewCachedDataAccess(cl))
-   nodePool := agent.DefaultgRPCNodePool(npmAddress, s.cert, s.certKey, s.certAuthority)
+   nodePool := agent_grpc.DefaultgRPCNodePool(npmAddress, s.cert, s.certKey, s.certAuthority)
    // Select the placement algorithm
    var placer agent.Placer
    switch getEnv(EnvLBPlacementAlg, "") {

@@ -7,6 +7,7 @@ import (

    "github.com/fnproject/fn/api/agent"
    "github.com/fnproject/fn/api/agent/hybrid"
+   agent_grpc "github.com/fnproject/fn/api/agent/nodepool/grpc"
    "github.com/fnproject/fn/api/server"
    "github.com/fnproject/fn/poolmanager"

@@ -26,7 +27,7 @@ type SystemTestNodePool struct {
}

func NewSystemTestNodePool() (agent.NodePool, error) {
-   factory := agent.GRPCRunnerFactory
+   factory := agent_grpc.GRPCRunnerFactory
    addr0 := fmt.Sprintf("%s:9190", whoAmI())
    addr1 := fmt.Sprintf("%s:9191", whoAmI())
    addr2 := fmt.Sprintf("%s:9192", whoAmI())