X-Git-Url: https://gerrit.o-ran-sc.org/r/gitweb?a=blobdiff_plain;f=dmaap-mediator-producer%2Finternal%2Fjobs%2Fjobs.go;h=0bf2f12a06d709ce4d445963078f7737e82cdcaf;hb=db7b5c801bdc96889aea18ab190f2b72fa8d8e06;hp=10eaf680ff3b4c1050c72d606d39cb07ee7c870d;hpb=63a42cacf9c52b7dff64431a3354f55c49bd6e4b;p=nonrtric.git diff --git a/dmaap-mediator-producer/internal/jobs/jobs.go b/dmaap-mediator-producer/internal/jobs/jobs.go index 10eaf680..0bf2f12a 100644 --- a/dmaap-mediator-producer/internal/jobs/jobs.go +++ b/dmaap-mediator-producer/internal/jobs/jobs.go @@ -21,102 +21,426 @@ package jobs import ( - "os" - "path/filepath" + "fmt" "strings" + "sync" + "time" + + "github.com/confluentinc/confluent-kafka-go/kafka" + log "github.com/sirupsen/logrus" + "oransc.org/nonrtric/dmaapmediatorproducer/internal/config" + "oransc.org/nonrtric/dmaapmediatorproducer/internal/kafkaclient" + "oransc.org/nonrtric/dmaapmediatorproducer/internal/restclient" ) -type Type struct { - TypeId string - Schema string +type TypeData struct { + Identity string `json:"id"` + jobsHandler *jobsHandler } +type sourceType string + +const dMaaPSource = sourceType("dmaap") +const kafkaSource = sourceType("kafka") + type JobInfo struct { - Owner string `json:"owner"` - LastUpdated string `json:"last_updated"` - InfoJobIdentity string `json:"info_job_identity"` - TargetUri string `json:"target_uri"` - InfoJobData string `json:"info_job_data"` - InfoTypeIdentity string `json:"info_type_identity"` + Owner string `json:"owner"` + LastUpdated string `json:"last_updated"` + InfoJobIdentity string `json:"info_job_identity"` + TargetUri string `json:"target_uri"` + InfoJobData Parameters `json:"info_job_data"` + InfoTypeIdentity string `json:"info_type_identity"` + sourceType sourceType } -type JobHandler interface { - AddJob(JobInfo) error +type JobTypesManager interface { + LoadTypesFromConfiguration(types []config.TypeDefinition) []config.TypeDefinition + GetSupportedTypes() []string } -var ( - typeDir = "configs" - Handler JobHandler - allJobs = make(map[string]map[string]JobInfo) -) +type JobsManager interface { + AddJobFromRESTCall(JobInfo) error + DeleteJobFromRESTCall(jobId string) +} -func init() { - Handler = newJobHandlerImpl() +type JobsManagerImpl struct { + allTypes map[string]TypeData + pollClient restclient.HTTPClient + mrAddress string + kafkaFactory kafkaclient.KafkaFactory + distributeClient restclient.HTTPClient } -type jobHandlerImpl struct{} +func NewJobsManagerImpl(pollClient restclient.HTTPClient, mrAddr string, kafkaFactory kafkaclient.KafkaFactory, distributeClient restclient.HTTPClient) *JobsManagerImpl { + return &JobsManagerImpl{ + allTypes: make(map[string]TypeData), + pollClient: pollClient, + mrAddress: mrAddr, + kafkaFactory: kafkaFactory, + distributeClient: distributeClient, + } +} -func newJobHandlerImpl() *jobHandlerImpl { - return &jobHandlerImpl{} +func (jm *JobsManagerImpl) AddJobFromRESTCall(ji JobInfo) error { + if err := jm.validateJobInfo(ji); err == nil { + typeData := jm.allTypes[ji.InfoTypeIdentity] + ji.sourceType = typeData.jobsHandler.sourceType + typeData.jobsHandler.addJobCh <- ji + log.Debug("Added job: ", ji) + return nil + } else { + return err + } } -func (jh *jobHandlerImpl) AddJob(ji JobInfo) error { - if jobs, ok := allJobs[ji.InfoTypeIdentity]; ok { - if _, ok := jobs[ji.InfoJobIdentity]; ok { - // TODO: Update job - } else { - jobs[ji.InfoJobIdentity] = ji - } +func (jm *JobsManagerImpl) DeleteJobFromRESTCall(jobId string) { + for _, typeData := range jm.allTypes { + log.Debugf("Deleting job %v from type %v", jobId, typeData.Identity) + typeData.jobsHandler.deleteJobCh <- jobId + } + log.Debug("Deleted job: ", jobId) +} + +func (jm *JobsManagerImpl) validateJobInfo(ji JobInfo) error { + if _, ok := jm.allTypes[ji.InfoTypeIdentity]; !ok { + return fmt.Errorf("type not supported: %v", ji.InfoTypeIdentity) + } + if ji.InfoJobIdentity == "" { + return fmt.Errorf("missing required job identity: %v", ji) + } + // Temporary for when there are only REST callbacks needed + if ji.TargetUri == "" { + return fmt.Errorf("missing required target URI: %v", ji) } return nil } -func GetTypes() ([]*Type, error) { - types := make([]*Type, 0, 1) - err := filepath.Walk(typeDir, - func(path string, info os.FileInfo, err error) error { - if err != nil { - return err - } - if strings.Contains(path, ".json") { - if jobType, err := getType(path); err == nil { - types = append(types, jobType) - } - } - return nil - }) - if err != nil { - return nil, err +func (jm *JobsManagerImpl) LoadTypesFromConfiguration(types []config.TypeDefinition) []config.TypeDefinition { + for _, typeDef := range types { + if typeDef.DMaaPTopicURL == "" && typeDef.KafkaInputTopic == "" { + log.Fatal("DMaaPTopicURL or KafkaInputTopic must be defined for type: ", typeDef.Identity) + } + jm.allTypes[typeDef.Identity] = TypeData{ + Identity: typeDef.Identity, + jobsHandler: newJobsHandler(typeDef, jm.mrAddress, jm.kafkaFactory, jm.pollClient, jm.distributeClient), + } } - return types, nil + return types } -func GetSupportedTypes() []string { +func (jm *JobsManagerImpl) GetSupportedTypes() []string { supportedTypes := []string{} - for k := range allJobs { + for k := range jm.allTypes { supportedTypes = append(supportedTypes, k) } return supportedTypes } -func AddJob(job JobInfo) error { - return Handler.AddJob(job) +func (jm *JobsManagerImpl) StartJobsForAllTypes() { + for _, jobType := range jm.allTypes { + + go jobType.jobsHandler.startPollingAndDistribution() + + } +} + +type jobsHandler struct { + mu sync.Mutex + typeId string + sourceType sourceType + pollingAgent pollingAgent + jobs map[string]job + addJobCh chan JobInfo + deleteJobCh chan string + distributeClient restclient.HTTPClient } -func getType(path string) (*Type, error) { - fileName := filepath.Base(path) - typeName := strings.TrimSuffix(fileName, filepath.Ext(fileName)) +func newJobsHandler(typeDef config.TypeDefinition, mRAddress string, kafkaFactory kafkaclient.KafkaFactory, pollClient restclient.HTTPClient, distributeClient restclient.HTTPClient) *jobsHandler { + pollingAgent := createPollingAgent(typeDef, mRAddress, pollClient, kafkaFactory, typeDef.KafkaInputTopic) + sourceType := kafkaSource + if typeDef.DMaaPTopicURL != "" { + sourceType = dMaaPSource + } + return &jobsHandler{ + typeId: typeDef.Identity, + sourceType: sourceType, + pollingAgent: pollingAgent, + jobs: make(map[string]job), + addJobCh: make(chan JobInfo), + deleteJobCh: make(chan string), + distributeClient: distributeClient, + } +} - if typeSchema, err := os.ReadFile(path); err == nil { - typeInfo := Type{ - TypeId: typeName, - Schema: string(typeSchema), +func (jh *jobsHandler) startPollingAndDistribution() { + go func() { + for { + jh.pollAndDistributeMessages() } - if _, ok := allJobs[typeName]; !ok { - allJobs[typeName] = make(map[string]JobInfo) + }() + + go func() { + for { + jh.monitorManagementChannels() + } + }() +} + +func (jh *jobsHandler) pollAndDistributeMessages() { + log.Debugf("Processing jobs for type: %v", jh.typeId) + messagesBody, error := jh.pollingAgent.pollMessages() + if error != nil { + log.Warn("Error getting data from source. Cause: ", error) + time.Sleep(time.Minute) // Must wait before trying to call data source again + return + } + jh.distributeMessages(messagesBody) +} + +func (jh *jobsHandler) distributeMessages(messages []byte) { + if string(messages) != "[]" && len(messages) > 0 { // MR returns an ampty array if there are no messages. + log.Debug("Distributing messages: ", string(messages)) + jh.mu.Lock() + defer jh.mu.Unlock() + for _, job := range jh.jobs { + if len(job.messagesChannel) < cap(job.messagesChannel) { + job.messagesChannel <- messages + } else { + jh.emptyMessagesBuffer(job) + } + } + } +} + +func (jh *jobsHandler) emptyMessagesBuffer(job job) { + log.Debug("Emptying message queue for job: ", job.jobInfo.InfoJobIdentity) +out: + for { + select { + case <-job.messagesChannel: + default: + break out + } + } +} + +func (jh *jobsHandler) monitorManagementChannels() { + select { + case addedJob := <-jh.addJobCh: + jh.addJob(addedJob) + case deletedJob := <-jh.deleteJobCh: + jh.deleteJob(deletedJob) + } +} + +func (jh *jobsHandler) addJob(addedJob JobInfo) { + jh.mu.Lock() + log.Debug("Add job: ", addedJob) + newJob := newJob(addedJob, jh.distributeClient) + go newJob.start() + jh.jobs[addedJob.InfoJobIdentity] = newJob + jh.mu.Unlock() +} + +func (jh *jobsHandler) deleteJob(deletedJob string) { + jh.mu.Lock() + log.Debug("Delete job: ", deletedJob) + j, exist := jh.jobs[deletedJob] + if exist { + j.controlChannel <- struct{}{} + delete(jh.jobs, deletedJob) + } + jh.mu.Unlock() +} + +type pollingAgent interface { + pollMessages() ([]byte, error) +} + +func createPollingAgent(typeDef config.TypeDefinition, mRAddress string, pollClient restclient.HTTPClient, kafkaFactory kafkaclient.KafkaFactory, topicID string) pollingAgent { + if typeDef.DMaaPTopicURL != "" { + return dMaaPPollingAgent{ + messageRouterURL: mRAddress + typeDef.DMaaPTopicURL, + pollClient: pollClient, } - return &typeInfo, nil } else { + return newKafkaPollingAgent(kafkaFactory, typeDef.KafkaInputTopic) + } +} + +type dMaaPPollingAgent struct { + messageRouterURL string + pollClient restclient.HTTPClient +} + +func (pa dMaaPPollingAgent) pollMessages() ([]byte, error) { + return restclient.Get(pa.messageRouterURL, pa.pollClient) +} + +type kafkaPollingAgent struct { + kafkaClient kafkaclient.KafkaClient +} + +func newKafkaPollingAgent(kafkaFactory kafkaclient.KafkaFactory, topicID string) kafkaPollingAgent { + c, err := kafkaclient.NewKafkaClient(kafkaFactory, topicID) + if err != nil { + log.Fatalf("Cannot create Kafka client for topic: %v, error details: %v\n", topicID, err) + } + return kafkaPollingAgent{ + kafkaClient: c, + } +} + +func (pa kafkaPollingAgent) pollMessages() ([]byte, error) { + msg, err := pa.kafkaClient.ReadMessage() + if err == nil { + return msg, nil + } else { + if isKafkaTimedOutError(err) { + return []byte(""), nil + } return nil, err } } + +func isKafkaTimedOutError(err error) bool { + kafkaErr, ok := err.(kafka.Error) + return ok && kafkaErr.Code() == kafka.ErrTimedOut +} + +type job struct { + jobInfo JobInfo + client restclient.HTTPClient + messagesChannel chan []byte + controlChannel chan struct{} +} + +func newJob(j JobInfo, c restclient.HTTPClient) job { + + return job{ + jobInfo: j, + client: c, + messagesChannel: make(chan []byte, 10), + controlChannel: make(chan struct{}), + } +} + +type Parameters struct { + BufferTimeout BufferTimeout `json:"bufferTimeout"` +} + +type BufferTimeout struct { + MaxSize int `json:"maxSize"` + MaxTimeMiliseconds int64 `json:"maxTimeMiliseconds"` +} + +func (j *job) start() { + if j.isJobBuffered() { + j.startReadingMessagesBuffered() + } else { + j.startReadingSingleMessages() + } +} + +func (j *job) startReadingSingleMessages() { +out: + for { + select { + case <-j.controlChannel: + log.Debug("Stop distribution for job: ", j.jobInfo.InfoJobIdentity) + break out + case msg := <-j.messagesChannel: + j.sendMessagesToConsumer(msg) + } + } +} + +func (j *job) startReadingMessagesBuffered() { +out: + for { + select { + case <-j.controlChannel: + log.Debug("Stop distribution for job: ", j.jobInfo.InfoJobIdentity) + break out + default: + msgs := j.read(j.jobInfo.InfoJobData.BufferTimeout) + if len(msgs) > 0 { + j.sendMessagesToConsumer(msgs) + } + } + } +} + +func (j *job) read(bufferParams BufferTimeout) []byte { + wg := sync.WaitGroup{} + wg.Add(bufferParams.MaxSize) + rawMsgs := make([][]byte, 0, bufferParams.MaxSize) + c := make(chan struct{}) + go func() { + i := 0 + out: + for { + select { + case <-c: + break out + case msg := <-j.messagesChannel: + rawMsgs = append(rawMsgs, msg) + i++ + wg.Done() + if i == bufferParams.MaxSize { + break out + } + } + } + }() + j.waitTimeout(&wg, time.Duration(bufferParams.MaxTimeMiliseconds)*time.Millisecond) + close(c) + return getAsJSONArray(rawMsgs) +} + +func getAsJSONArray(rawMsgs [][]byte) []byte { + json := `"[` + for i := 0; i < len(rawMsgs); i++ { + msg := string(rawMsgs[i]) + json = json + strings.ReplaceAll(msg, "\"", "\\\"") + if i < len(rawMsgs)-1 { + json = json + "," + } + } + return []byte(json + `]"`) +} + +func (j *job) waitTimeout(wg *sync.WaitGroup, timeout time.Duration) bool { + c := make(chan struct{}) + go func() { + defer close(c) + wg.Wait() + }() + select { + case <-c: + return false // completed normally + case <-time.After(timeout): + return true // timed out + } +} + +func (j *job) sendMessagesToConsumer(messages []byte) { + log.Debug("Processing job: ", j.jobInfo.InfoJobIdentity) + contentType := restclient.ContentTypeJSON + if j.isJobKafka() && !j.isJobBuffered() { + contentType = restclient.ContentTypePlain + } + if postErr := restclient.Post(j.jobInfo.TargetUri, messages, contentType, j.client); postErr != nil { + log.Warnf("Error posting data for job: %v. Cause: %v", j.jobInfo, postErr) + return + } + log.Debugf("Messages for job: %v distributed to consumer: %v", j.jobInfo.InfoJobIdentity, j.jobInfo.Owner) +} + +func (j *job) isJobBuffered() bool { + return j.jobInfo.InfoJobData.BufferTimeout.MaxSize > 0 && j.jobInfo.InfoJobData.BufferTimeout.MaxTimeMiliseconds > 0 +} + +func (j *job) isJobKafka() bool { + return j.jobInfo.sourceType == kafkaSource +}