2024-07-19 13:28:48 +00:00
|
|
|
package plug
|
|
|
|
|
|
|
|
import (
	"context"
	"sync"

	"git.anthrove.art/Anthrove/otter-space-sdk/v3/pkg/database"
	"git.anthrove.art/Anthrove/otter-space-sdk/v3/pkg/models"
	gRPC "git.anthrove.art/Anthrove/plug-sdk/v3/pkg/grpc"
	gonanoid "github.com/matoous/go-nanoid/v2"
	log "github.com/sirupsen/logrus"
	"go.opentelemetry.io/otel/attribute"
	"go.opentelemetry.io/otel/codes"
	"go.opentelemetry.io/otel/trace"
)
|
|
|
|
|
|
|
|
type server struct {
|
|
|
|
gRPC.UnimplementedPlugConnectorServer
|
|
|
|
ctx map[string]context.CancelFunc
|
|
|
|
taskExecutionFunction TaskExecution
|
|
|
|
sendMessageExecution SendMessageExecution
|
|
|
|
getMessageExecution GetMessageExecution
|
2024-08-15 07:56:40 +00:00
|
|
|
source models.Source
|
2024-07-19 13:28:48 +00:00
|
|
|
}
|
|
|
|
|
2024-08-15 07:56:40 +00:00
|
|
|
func NewGrpcServer(source models.Source, taskExecutionFunction TaskExecution, sendMessageExecution SendMessageExecution, getMessageExecution GetMessageExecution) gRPC.PlugConnectorServer {
|
2024-07-19 13:28:48 +00:00
|
|
|
return &server{
|
|
|
|
ctx: make(map[string]context.CancelFunc),
|
|
|
|
taskExecutionFunction: taskExecutionFunction,
|
|
|
|
sendMessageExecution: sendMessageExecution,
|
|
|
|
getMessageExecution: getMessageExecution,
|
2024-08-15 07:56:40 +00:00
|
|
|
source: source,
|
2024-07-19 13:28:48 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s *server) TaskStart(ctx context.Context, creation *gRPC.PlugTaskCreation) (*gRPC.PlugTaskStatus, error) {
|
2024-08-26 13:42:42 +00:00
|
|
|
ctx, span := tracer.Start(ctx, "TaskStart")
|
|
|
|
defer span.End()
|
|
|
|
|
2024-07-19 13:28:48 +00:00
|
|
|
var plugTaskState gRPC.PlugTaskStatus
|
|
|
|
|
|
|
|
id, err := gonanoid.New()
|
|
|
|
if err != nil {
|
2024-08-26 13:42:42 +00:00
|
|
|
span.RecordError(err)
|
|
|
|
span.SetStatus(codes.Error, err.Error())
|
2024-07-19 13:28:48 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
2024-08-26 13:42:42 +00:00
|
|
|
span.AddEvent("Generated task ID", trace.WithAttributes(attribute.String("task_id", id)))
|
2024-07-19 13:28:48 +00:00
|
|
|
|
|
|
|
plugTaskState.TaskId = id
|
|
|
|
plugTaskState.TaskState = gRPC.PlugTaskState_RUNNING
|
|
|
|
|
2024-08-17 18:23:11 +00:00
|
|
|
userSource, err := database.GetUserSourceByID(ctx, models.UserSourceID(creation.UserSourceId))
|
|
|
|
if err != nil {
|
2024-08-26 13:42:42 +00:00
|
|
|
span.RecordError(err)
|
|
|
|
span.SetStatus(codes.Error, err.Error())
|
2024-08-17 18:23:11 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
2024-08-26 13:42:42 +00:00
|
|
|
span.AddEvent("Retrieved user source", trace.WithAttributes(attribute.String("user_source_id", creation.UserSourceId)))
|
2024-07-19 13:28:48 +00:00
|
|
|
|
|
|
|
// gRPC closes the context after the call ended. So the whole scrapping stopped without waiting
|
|
|
|
// by using this method we assign a new context to each new request we get.
|
|
|
|
// This can be used for example to close the context with the given id
|
2024-08-26 14:44:50 +00:00
|
|
|
ctx = trace.ContextWithSpanContext(context.Background(), trace.NewSpanContext(trace.SpanContextConfig{TraceID: span.SpanContext().TraceID()}))
|
2024-08-26 14:38:14 +00:00
|
|
|
taskCtx, cancel := context.WithCancel(ctx)
|
2024-07-19 13:28:48 +00:00
|
|
|
s.ctx[id] = cancel
|
2024-08-26 13:42:42 +00:00
|
|
|
span.AddEvent("Created new context for task", trace.WithAttributes(attribute.String("task_id", id)))
|
|
|
|
|
2024-08-26 14:38:14 +00:00
|
|
|
log.WithContext(taskCtx).WithFields(log.Fields{
|
2024-08-26 13:42:42 +00:00
|
|
|
"task_id": id,
|
|
|
|
"user_source_id": creation.UserSourceId,
|
|
|
|
}).Info("Starting task")
|
2024-07-19 13:28:48 +00:00
|
|
|
|
|
|
|
go func() {
|
2024-08-26 13:42:42 +00:00
|
|
|
err := s.taskExecutionFunction(taskCtx, userSource, creation.DeepScrape, creation.ApiKey, func() {
|
2024-07-19 13:28:48 +00:00
|
|
|
s.removeTask(id)
|
|
|
|
})
|
|
|
|
if err != nil {
|
2024-08-26 13:42:42 +00:00
|
|
|
log.WithContext(taskCtx).WithError(err).WithField("task_id", id).Error("Task execution failed")
|
|
|
|
span.RecordError(err)
|
|
|
|
span.SetStatus(codes.Error, err.Error())
|
|
|
|
} else {
|
|
|
|
log.WithContext(taskCtx).WithField("task_id", id).Info("Task completed successfully")
|
|
|
|
span.AddEvent("Task completed successfully", trace.WithAttributes(attribute.String("task_id", id)))
|
2024-07-19 13:28:48 +00:00
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
2024-08-26 13:42:42 +00:00
|
|
|
span.SetAttributes(attribute.String("task_id", id))
|
2024-07-19 13:28:48 +00:00
|
|
|
return &plugTaskState, nil
|
|
|
|
}
|
|
|
|
|
2024-08-26 13:42:42 +00:00
|
|
|
func (s *server) TaskStatus(ctx context.Context, task *gRPC.PlugTask) (*gRPC.PlugTaskStatus, error) {
|
|
|
|
ctx, span := tracer.Start(ctx, "TaskStatus")
|
|
|
|
defer span.End()
|
|
|
|
|
2024-07-19 13:28:48 +00:00
|
|
|
var plugTaskState gRPC.PlugTaskStatus
|
|
|
|
|
|
|
|
_, found := s.ctx[task.TaskId]
|
|
|
|
plugTaskState.TaskId = task.TaskId
|
|
|
|
|
|
|
|
plugTaskState.TaskState = gRPC.PlugTaskState_RUNNING
|
|
|
|
|
|
|
|
if !found {
|
|
|
|
plugTaskState.TaskState = gRPC.PlugTaskState_UNKNOWN
|
|
|
|
}
|
2024-08-26 13:42:42 +00:00
|
|
|
span.AddEvent("Determined task state", trace.WithAttributes(attribute.String("task_id", task.TaskId), attribute.String("task_state", plugTaskState.TaskState.String())))
|
|
|
|
|
|
|
|
log.WithContext(ctx).WithFields(log.Fields{
|
|
|
|
"task_id": task.TaskId,
|
|
|
|
"task_state": plugTaskState.TaskState,
|
|
|
|
}).Info("Task status requested")
|
|
|
|
|
|
|
|
span.SetAttributes(attribute.String("task_id", task.TaskId))
|
2024-07-19 13:28:48 +00:00
|
|
|
return &plugTaskState, nil
|
|
|
|
}
|
|
|
|
|
2024-08-26 13:42:42 +00:00
|
|
|
func (s *server) TaskCancel(ctx context.Context, task *gRPC.PlugTask) (*gRPC.PlugTaskStatus, error) {
|
|
|
|
ctx, span := tracer.Start(ctx, "TaskCancel")
|
|
|
|
defer span.End()
|
|
|
|
|
2024-07-19 13:28:48 +00:00
|
|
|
var plugTaskState gRPC.PlugTaskStatus
|
|
|
|
|
|
|
|
plugTaskState.TaskState = gRPC.PlugTaskState_STOPPED
|
|
|
|
plugTaskState.TaskId = task.TaskId
|
|
|
|
|
|
|
|
s.removeTask(task.TaskId)
|
2024-08-26 13:42:42 +00:00
|
|
|
span.AddEvent("Removed task", trace.WithAttributes(attribute.String("task_id", task.TaskId)))
|
2024-07-19 13:28:48 +00:00
|
|
|
|
2024-08-26 13:42:42 +00:00
|
|
|
log.WithContext(ctx).WithFields(log.Fields{
|
|
|
|
"task_id": task.TaskId,
|
|
|
|
"task_state": plugTaskState.TaskState,
|
|
|
|
}).Info("Task cancellation requested")
|
|
|
|
|
|
|
|
span.SetAttributes(attribute.String("task_id", task.TaskId))
|
2024-07-19 13:28:48 +00:00
|
|
|
return &plugTaskState, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s *server) removeTask(taskID string) {
|
|
|
|
fn, exists := s.ctx[taskID]
|
|
|
|
if !exists {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
fn()
|
|
|
|
delete(s.ctx, taskID)
|
|
|
|
}
|