// ========================LICENSE_START=================================
// Copyright (C) 2023: Nordix Foundation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// ========================LICENSE_END===================================
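
// Package kafkacollector contains the Kafka plumbing of the PM file
// converter: topic readers, a topic writer and the per-type xml-to-json
// conversion jobs, authenticating with OAuth2 client credentials when
// CREDS_GRANT_TYPE is set.
//
// Minimal wiring sketch (channel size, topic, group and client ids are
// illustrative only, not defined by this package):
//
//	ctl := make(chan dataTypes.ReaderControl)
//	data := make(chan *dataTypes.KafkaPayload, 100)
//	go kafkacollector.Start_topic_reader("xml-file-ready-kp", "PmData", ctl, data, "pm-group", "pm-client")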
package kafkacollector
25 "github.com/confluentinc/confluent-kafka-go/kafka"
26 jsoniter "github.com/json-iterator/go"
27 log "github.com/sirupsen/logrus"
28 "golang.org/x/oauth2/clientcredentials"
29 "main/common/dataTypes"
30 "main/components/miniocollector"
var creds_grant_type = os.Getenv("CREDS_GRANT_TYPE")
var bootstrapserver = os.Getenv("KAFKA_SERVER")
var creds_client_secret = os.Getenv("CREDS_CLIENT_SECRET")
var creds_client_id = os.Getenv("CREDS_CLIENT_ID")
var creds_service_url = os.Getenv("AUTH_SERVICE_URL")

// Limiter - valid for all jobs
const parallelism_limiter = 100

var jobLimiterChan = make(chan struct{}, parallelism_limiter)
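
// Start_topic_reader creates a consumer, subscribes to the given topic and
// forwards each consumed message to data_ch until an EXIT command arrives
// on control_ch. Consumer creation and subscription are retried every second.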
func Start_topic_reader(topic string, type_id string, control_ch chan dataTypes.ReaderControl, data_ch chan *dataTypes.KafkaPayload, gid string, cid string) {

    log.Info("Topic reader starting, topic: ", topic, " for type: ", type_id)

    topic_ok := false
    var c *kafka.Consumer

    for !topic_ok {
        select {
        case reader_ctrl := <-control_ch:
            if reader_ctrl.Command == "EXIT" {
                log.Info("Topic reader on topic: ", topic, " for type: ", type_id, " - stopped")
                data_ch <- nil // Signal to job handler
                return
            }
        case <-time.After(1 * time.Second):
            if c == nil {
                c = create_kafka_consumer(type_id, gid, cid)
                if c == nil {
                    log.Info("Cannot start consumer on topic: ", topic, " for type: ", type_id, " - retrying")
                } else {
                    log.Info("Consumer started on topic: ", topic, " for type: ", type_id)
                }
            }
            if c != nil && !topic_ok {
                err := c.SubscribeTopics([]string{topic}, nil)
                if err != nil {
                    log.Info("Topic reader cannot start subscribing on topic: ", topic, " for type: ", type_id, " - retrying -- error details: ", err)
                } else {
                    log.Info("Topic reader subscribing on topic: ", topic, " for type: ", type_id)
                    topic_ok = true
                }
            }
        }
    }
    log.Info("Topic reader ready on topic: ", topic, " for type: ", type_id)

    // Event loop handling token refresh and other consumer events
    var event_chan = make(chan int)
    go func() {
        for {
            select {
            case evt := <-c.Events():
                switch evt.(type) {
                case kafka.OAuthBearerTokenRefresh:
                    log.Debug("New consumer token needed: ", evt)
                    token, err := Fetch_token()
                    if err != nil {
                        log.Warning("Cannot fetch token: ", err)
                        c.SetOAuthBearerTokenFailure(err.Error())
                    } else {
                        setTokenError := c.SetOAuthBearerToken(*token)
                        if setTokenError != nil {
                            log.Warning("Cannot set token: ", setTokenError)
                            c.SetOAuthBearerTokenFailure(setTokenError.Error())
                        }
                    }
                default:
                    log.Debug("Dumping topic reader event on topic: ", topic, " for type: ", type_id, " evt: ", evt.String())
                }
            case msg := <-event_chan:
                if msg == 0 {
                    return
                }
            case <-time.After(1 * time.Second):
                // Periodic wake-up
            }
        }
    }()

    // Poll loop delivering consumed messages to the job handler
    go func() {
        for {
            select {
            case reader_ctrl := <-control_ch:
                if reader_ctrl.Command == "EXIT" {
                    event_chan <- 0
                    log.Debug("Topic reader on topic: ", topic, " for type: ", type_id, " - stopped")
                    data_ch <- nil // Signal to job handler
                    defer c.Close()
                    return
                }
            default:
                ev := c.Poll(1000)
                if ev == nil {
                    log.Debug("Topic Reader for type: ", type_id, " Nothing to consume on topic: ", topic)
                    continue
                }
                switch e := ev.(type) {
                case *kafka.Message:
                    var kmsg dataTypes.KafkaPayload
                    kmsg.Msg = e
                    c.Commit() // Manual commit - auto commit is disabled in the consumer config
                    data_ch <- &kmsg
                    log.Debug("Reader msg: ", &kmsg)
                    log.Debug("Reader - data_ch ", data_ch)
                case kafka.Error:
                    fmt.Fprintf(os.Stderr, "%% Error: %v: %v\n", e.Code(), e)
                case kafka.OAuthBearerTokenRefresh:
                    log.Debug("New consumer token needed: ", ev)
                    token, err := Fetch_token()
                    if err != nil {
                        log.Warning("Cannot fetch token: ", err)
                        c.SetOAuthBearerTokenFailure(err.Error())
                    } else {
                        setTokenError := c.SetOAuthBearerToken(*token)
                        if setTokenError != nil {
                            log.Warning("Cannot set token: ", setTokenError)
                            c.SetOAuthBearerTokenFailure(setTokenError.Error())
                        }
                    }
                default:
                    fmt.Printf("Ignored %v\n", e)
                }
            }
        }
    }()
}
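
// Start_topic_writer starts the shared kafka producer and publishes each
// payload received on data_ch to the topic given in the payload, retrying
// failed sends with a linear back-off before discarding the message.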
func Start_topic_writer(control_ch chan dataTypes.WriterControl, data_ch chan *dataTypes.KafkaPayload) {

    var kafka_producer *kafka.Producer

    log.Info("Topic writer starting")

    // Wait for kafka producer to become available - and be prepared to exit the writer
    for kafka_producer == nil {
        select {
        case writer_ctl := <-control_ch:
            if writer_ctl.Command == "EXIT" {
                // ignore cmd - handled by channel signal
            }
        default:
            kafka_producer = start_producer()
            if kafka_producer == nil {
                log.Debug("Could not start kafka producer - retrying")
                time.Sleep(1 * time.Second)
            } else {
                log.Debug("Kafka producer started")
            }
        }
    }

    // Event loop handling delivery reports and token refresh
    var event_chan = make(chan int)
    go func() {
        for {
            select {
            case evt := <-kafka_producer.Events():
                switch evt.(type) {
                case *kafka.Message:
                    m := evt.(*kafka.Message)
                    if m.TopicPartition.Error != nil {
                        log.Debug("Dumping topic writer event, failed: ", m.TopicPartition.Error)
                    } else {
                        log.Debug("Dumping topic writer event, message to topic: ", *m.TopicPartition.Topic, " at offset: ", m.TopicPartition.Offset, " at partition: ", m.TopicPartition.Partition)
                    }
                case kafka.Error:
                    log.Debug("Dumping topic writer event, error: ", evt)
                case kafka.OAuthBearerTokenRefresh:
                    log.Debug("New producer token needed: ", evt)
                    token, err := Fetch_token()
                    if err != nil {
                        log.Warning("Cannot fetch token: ", err)
                        kafka_producer.SetOAuthBearerTokenFailure(err.Error())
                    } else {
                        setTokenError := kafka_producer.SetOAuthBearerToken(*token)
                        if setTokenError != nil {
                            log.Warning("Cannot set token: ", setTokenError)
                            kafka_producer.SetOAuthBearerTokenFailure(setTokenError.Error())
                        }
                    }
                default:
                    log.Debug("Dumping topic writer event, unknown: ", evt)
                }
            case msg := <-event_chan:
                if msg == 0 {
                    return
                }
            case <-time.After(1 * time.Second):
                // Periodic wake-up
            }
        }
    }()

    // Send loop - publish each payload from data_ch with retries
    go func() {
        for {
            select {
            case writer_ctl := <-control_ch:
                if writer_ctl.Command == "EXIT" {
                    // ignore - wait for channel signal
                }
            case kmsg := <-data_ch:
                if kmsg == nil {
                    event_chan <- 0
                    log.Info("Topic writer stopped by channel signal - start_topic_writer")
                    defer kafka_producer.Close()
                    return
                }

                retries := 10 // Max send attempts before the message is discarded
                msg_ok := false
                var err error
                for retry := 1; retry <= retries && !msg_ok; retry++ {
                    err = kafka_producer.Produce(&kafka.Message{
                        TopicPartition: kafka.TopicPartition{Topic: &kmsg.Topic, Partition: kafka.PartitionAny},
                        Value:          kmsg.Msg.Value,
                        Key:            kmsg.Msg.Key}, nil)
                    if err == nil {
                        msg_ok = true
                        log.Debug("Topic writer, msg sent ok on topic: ", kmsg.Topic)
                    } else {
                        log.Info("Topic writer failed to send message on topic: ", kmsg.Topic, " - Retrying. Error details: ", err)
                        time.Sleep(time.Duration(retry) * time.Second)
                    }
                }
                if !msg_ok {
                    log.Error("Topic writer failed to send message on topic: ", kmsg.Topic, " - Msg discarded. Error details: ", err)
                }
            case <-time.After(1000 * time.Millisecond):
                // Periodic wake-up
            }
        }
    }()
}
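
// create_kafka_consumer creates a plain text consumer or, when
// CREDS_GRANT_TYPE is set, a SASL/OAUTHBEARER consumer. Returns nil on failure.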
func create_kafka_consumer(type_id string, gid string, cid string) *kafka.Consumer {
    var cm kafka.ConfigMap
    if creds_grant_type == "" {
        log.Info("Creating kafka plain text consumer for type: ", type_id)
        cm = kafka.ConfigMap{
            "bootstrap.servers":  bootstrapserver,
            "group.id":           gid,
            "client.id":          cid,
            "auto.offset.reset":  "latest",
            "enable.auto.commit": false,
        }
    } else {
        log.Info("Creating kafka SASL plain text consumer for type: ", type_id)
        cm = kafka.ConfigMap{
            "bootstrap.servers":  bootstrapserver,
            "group.id":           gid,
            "client.id":          cid,
            "auto.offset.reset":  "latest",
            "enable.auto.commit": false,
            "sasl.mechanism":     "OAUTHBEARER",
            "security.protocol":  "SASL_PLAINTEXT",
        }
    }

    c, err := kafka.NewConsumer(&cm)
    if err != nil {
        log.Error("Cannot create kafka consumer for type: ", type_id, ", error details: ", err)
        return nil
    }

    log.Info("Created kafka consumer for type: ", type_id, " OK")
    return c
}

// start_producer creates a plain text producer or, when CREDS_GRANT_TYPE is
// set, a SASL/OAUTHBEARER producer. Returns nil on failure.
func start_producer() *kafka.Producer {
    log.Info("Creating kafka producer")

    var cm kafka.ConfigMap
    if creds_grant_type == "" {
        log.Info("Creating kafka plain text producer")
        cm = kafka.ConfigMap{
            "bootstrap.servers": bootstrapserver,
        }
    } else {
        log.Info("Creating kafka SASL plain text producer")
        cm = kafka.ConfigMap{
            "bootstrap.servers": bootstrapserver,
            "sasl.mechanism":    "OAUTHBEARER",
            "security.protocol": "SASL_PLAINTEXT",
        }
    }

    p, err := kafka.NewProducer(&cm)
    if err != nil {
        log.Error("Cannot create kafka producer, ", err)
        return nil
    }
    return p
}
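
// Start_job_xml_file_data receives file-ready events for the given type on
// data_in_ch and spawns one run_xml_job goroutine per message, bounded by
// jobLimiterChan.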
func Start_job_xml_file_data(type_id string, control_ch chan dataTypes.JobControl, data_in_ch chan *dataTypes.KafkaPayload, data_out_channel chan *dataTypes.KafkaPayload, fvolume string, fsbucket string) {

    log.Info("Type job ", type_id, " started")
    topic_list := make(map[string]string)
    topic_list[type_id] = "json-file-ready-kp"
    topic_list["PmData"] = "json-file-ready-kpadp"
    for {
        select {
        case job_ctl := <-control_ch:
            log.Debug("Type job ", type_id, " new cmd received ", job_ctl.Command)
            switch job_ctl.Command {
            case "EXIT":
                //ignore cmd - handled by channel signal
            }
        case msg := <-data_in_ch:
            if msg == nil {
                log.Info("Type job ", type_id, " stopped by channel signal - start_job_xml_file_data")
                return
            }
            // Take a job slot (bounded by parallelism_limiter) and run the conversion
            jobLimiterChan <- struct{}{}
            go run_xml_job(type_id, msg, "gz", data_out_channel, topic_list, jobLimiterChan, fvolume, fsbucket)

        case <-time.After(1 * time.Second):
            // Periodic wake-up
        }
    }
}
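
// run_xml_job converts one PM xml file to json and publishes a
// FileDownloadedEvt for the converted file on every topic in topic_list.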
func run_xml_job(type_id string, msg *dataTypes.KafkaPayload, outputCompression string, data_out_channel chan *dataTypes.KafkaPayload, topic_list map[string]string, jobLimiterChan chan struct{}, fvolume string, fsbucket string) {
    defer func() {
        // Release the job slot taken in Start_job_xml_file_data
        <-jobLimiterChan
    }()
    start := time.Now()

    var evt_data dataTypes.XmlFileEventHeader
    err := jsoniter.Unmarshal(msg.Msg.Value, &evt_data)
    if err != nil {
        log.Error("Cannot parse XmlFileEventHeader for type job: ", type_id, " - discarding message, error details: ", err)
        return
    }
    log.Debug("Unmarshal file-collect event for type job: ", type_id, " time: ", time.Since(start).String())

    start = time.Now()
    new_fn := miniocollector.Xml_to_json_conv(&evt_data)
    // Assumption: an empty filename signals a failed conversion
    if new_fn == "" {
        log.Error("Cannot convert file ", evt_data.Name, " - discarding message")
        return
    }
    log.Debug("Converted file to json: ", new_fn, " time: ", time.Since(start).String())

    start = time.Now()
    var fde dataTypes.FileDownloadedEvt
    fde.Filename = new_fn
    j, err := jsoniter.Marshal(fde)
    if err != nil {
        log.Error("Cannot marshal FileDownloadedEvt - discarding message, ", err)
        return
    }

    msg.Msg.Value = j
    msg.Msg.Key = []byte("\"" + evt_data.SourceName + "\"")
    log.Debug("Marshal file-collect event ", time.Since(start).String())
    log.Debug("Sending file-collect event to output topic(s), count: ", len(topic_list))
    for _, v := range topic_list {
        fmt.Println("Output Topic: " + v)
        var kmsg *dataTypes.KafkaPayload = new(dataTypes.KafkaPayload)
        kmsg.Msg = msg.Msg
        kmsg.Topic = v
        data_out_channel <- kmsg
    }
}
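
// Fetch_token fetches an OAuth2 access token using the client credentials
// flow and wraps it as a kafka.OAuthBearerToken.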
func Fetch_token() (*kafka.OAuthBearerToken, error) {
    log.Debug("Get token inline")
    conf := &clientcredentials.Config{
        ClientID:     creds_client_id,
        ClientSecret: creds_client_secret,
        TokenURL:     creds_service_url,
    }
    token, err := conf.Token(context.Background())
    if err != nil {
        log.Warning("Cannot fetch access token: ", err)
        return nil, err
    }

    extensions := map[string]string{}
    log.Debug("token: ", token)
    log.Debug("TokenValue: ", token.AccessToken)
    log.Debug("Expiration: ", token.Expiry)

    oauthBearerToken := kafka.OAuthBearerToken{
        TokenValue: token.AccessToken,
        Expiration: token.Expiry,
        Extensions: extensions,
    }

    return &oauthBearerToken, nil
}