X-Git-Url: https://gerrit.o-ran-sc.org/r/gitweb?a=blobdiff_plain;f=include%2Fhfta%2Frunning_gb_operator.h;h=c20c87f64ae6f88da743e3e26da586f36f478eaa;hb=7cec316889150a8a92238e52c7bad1270608b333;hp=0762c639cb659dd988cb30e452fe144e3a3ee6a5;hpb=07495effe193ca3f73c3bf0ce417068f9ac9dcdd;p=com%2Fgs-lite.git

diff --git a/include/hfta/running_gb_operator.h b/include/hfta/running_gb_operator.h
index 0762c63..c20c87f 100644
--- a/include/hfta/running_gb_operator.h
+++ b/include/hfta/running_gb_operator.h
@@ -1,141 +1,154 @@
-/* ------------------------------------------------
-Copyright 2014 AT&T Intellectual Property
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-     http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
- ------------------------------------------- */
-
-#ifndef RWGROUPBY_OPERATOR_H
-#define RWGROUPBY_OPERATOR_H
-
-#include "host_tuple.h"
-#include "base_operator.h"
-#include <list>
-#include "hash_table.h"
-
-#define _GB_FLUSH_PER_TUPLE_ 1
-
-using namespace std;
-
-template <class groupby_func, class group, class aggregate, class hasher_func, class equal_func>
-class running_agg_operator : public base_operator {
-private :
-	groupby_func func;
-	hash_table<group*, aggregate*, hasher_func, equal_func> group_table;
-	typename hash_table<group*, aggregate*, hasher_func, equal_func>::iterator flush_pos;
-
-
-
-public:
-	running_agg_operator(int schema_handle, const char* name) : base_operator(name), func(schema_handle) {
-		flush_pos = group_table.end();
-	}
-
-	virtual int accept_tuple(host_tuple& tup, list<host_tuple>& result) {
-
-//			Push out completed groups
-
-		// create buffer on the stack to store key object
-		char buffer[sizeof(group)];
-
-		// extract the key information from the tuple and
-		// copy it into buffer
-		group* grp = func.create_group(tup, buffer);
-/*//			Ignore temp tuples until we can fix their timestamps.
-if (func.temp_status_received()) {
- tup.free_tuple();
- return 0;
-}
-*/
-
-		if (!grp) {
-			if (func.flush_needed()){
-				flush(result);
-			}
-			if (func.temp_status_received()) {
-				host_tuple temp_tup;
-				if (!func.create_temp_status_tuple(temp_tup, true)) {
-					temp_tup.channel = output_channel;
-					result.push_back(temp_tup);
-				}
-			}
-			tup.free_tuple();
-			return 0;
-		}
-
-		if (func.flush_needed()) {
-			flush(result);
-		}
-		typename hash_table<group*, aggregate*, hasher_func, equal_func>::iterator iter;
-		if ((iter = group_table.find(grp)) != group_table.end()) {
-			aggregate* old_aggr = (*iter).second;
-			func.update_aggregate(tup, grp, old_aggr);
-		}else{
-			// create a copy of the group on the heap
-			group* new_grp = new group(grp);	// need a copy constructor for groups
-//			aggregate* aggr = (aggregate*)malloc(sizeof(aggregate));
-			aggregate* aggr = new aggregate();
-			// create an aggregate in preallocated buffer
-			aggr = func.create_aggregate(tup, (char*)aggr);
-
-			group_table.insert(new_grp, aggr);
-		}
-		tup.free_tuple();
-		return 0;
-	}
-
-	virtual int flush(list<host_tuple>& result) {
-		host_tuple tup;
-		typename hash_table<group*, aggregate*, hasher_func, equal_func>::iterator iter;
-//		If the old table isn't empty, flush it now.
-		for (flush_pos = group_table.begin(); flush_pos != group_table.end(); ) {
-			bool failed = false;
-			tup = func.create_output_tuple((*flush_pos).first,(*flush_pos).second, failed);
-			if (!failed) {
-				tup.channel = output_channel;
-				result.push_back(tup);
-			}
-			if(func.cleaning_when((*flush_pos).first,(*flush_pos).second)){
-			    group* g = (*flush_pos).first;
-		    	aggregate* a = (*flush_pos).second;
-				++flush_pos;
-				group_table.erase(g);
-				delete (g);
-				delete (a);
-			}else{
-				func.reinit_aggregates((*flush_pos).first, (*flush_pos).second);
-				++flush_pos;
-			}
-		}
-
-		return 0;
-	}
-
-	virtual int set_param_block(int sz, void * value) {
-		func.set_param_block(sz, value);
-		return 0;
-	}
-
-	virtual int get_temp_status(host_tuple& result) {
-		result.channel = output_channel;
-		return func.create_temp_status_tuple(result, true);
-	}
-
-	virtual int get_blocked_status () {
-		return -1;
-	}
-
-	unsigned int get_mem_footprint() {
-		return group_table.get_mem_footprint();
-	}
-};
-
-#endif	// GROUPBY_OPERATOR_H
+/* ------------------------------------------------
+Copyright 2014 AT&T Intellectual Property
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
+ ------------------------------------------- */
+
+#ifndef RWGROUPBY_OPERATOR_H
+#define RWGROUPBY_OPERATOR_H
+
+#include "host_tuple.h"
+#include "base_operator.h"
+#include <list>
+#include "hash_table.h"
+
+#define _GB_FLUSH_PER_TUPLE_ 1
+
+using namespace std;
+
+template <class groupby_func, class group, class aggregate, class hasher_func, class equal_func>
+class running_agg_operator : public base_operator {
+private :
+	groupby_func func;
+	hash_table<group*, aggregate*, hasher_func, equal_func> group_table;
+	typename hash_table<group*, aggregate*, hasher_func, equal_func>::iterator flush_pos;
+	gs_int32_t nflushes;
+
+
+
+public:
+	running_agg_operator(int schema_handle, const char* name) : base_operator(name), func(schema_handle) {
+		flush_pos = group_table.end();
+	}
+
+	virtual int accept_tuple(host_tuple& tup, list<host_tuple>& result) {
+
+//			Push out completed groups
+
+// create buffer on the stack to store key object
+		char buffer[sizeof(group)];
+//	Number of flushes required
+
+// extract the key information from the tuple and
+// copy it into buffer
+		group* grp = func.create_group(tup, buffer);
+		nflushes = func.flush_needed();
+		
+		if (!grp) {
+			if (nflushes>0){
+				flush(result);
+			}
+			if (func.temp_status_received()) {
+				host_tuple temp_tup;
+				if (!func.create_temp_status_tuple(temp_tup, true)) {
+					temp_tup.channel = output_channel;
+					result.push_back(temp_tup);
+				}
+			}
+			tup.free_tuple();
+			return 0;
+		}
+
+		if (nflushes>0) {
+			flush(result);
+		}
+		typename hash_table<group*, aggregate*, hasher_func, equal_func>::iterator iter;
+		if ((iter = group_table.find(grp)) != group_table.end()) {
+			aggregate* old_aggr = (*iter).second;
+			func.update_aggregate(tup, grp, old_aggr);
+		}else{
+			// create a copy of the group on the heap
+			group* new_grp = new group(grp);	// need a copy constructor for groups
+//			aggregate* aggr = (aggregate*)malloc(sizeof(aggregate));
+			aggregate* aggr = new aggregate();
+			// create an aggregate in preallocated buffer
+			aggr = func.create_aggregate(tup, (char*)aggr);
+
+			group_table.insert(new_grp, aggr);
+		}
+		tup.free_tuple();
+		return 0;
+	}
+
+	virtual int flush(list<host_tuple>& result) {
+		host_tuple tup;
+		typename hash_table<group*, aggregate*, hasher_func, equal_func>::iterator iter;
+
+//	Limit the number of successive flushes - avoid explosive behavior
+		const gs_int32_t max_flushes = 10;
+		if(nflushes>max_flushes){
+			fprintf(stderr,"Warning in operator %s, temporal advance of %d windows needed, max number of windows that can be reported at once is %d\n",op_name, nflushes, max_flushes);
+			nflushes = max_flushes;
+		}
+
+		for(gs_int32_t flush_no = 0; flush_no < nflushes; ++flush_no){
+//	advance the TB for the reinit
+			if(flush_no < nflushes-1){
+				func.advance_last_tb();
+			}else{
+				func.reset_last_tb();	// Move to current tb in case flush limit reached
+			}
+//		If the old table isn't empty, flush it now.
+			for (flush_pos = group_table.begin(); flush_pos != group_table.end(); ) {
+				bool failed = false;
+				tup = func.create_output_tuple((*flush_pos).first,(*flush_pos).second, failed);
+				if (!failed) {
+					tup.channel = output_channel;
+					result.push_back(tup);
+				}
+				if(func.cleaning_when((*flush_pos).first,(*flush_pos).second)){
+			    	group* g = (*flush_pos).first;
+		    		aggregate* a = (*flush_pos).second;
+					++flush_pos;
+					group_table.erase(g);
+					delete (g);
+					delete (a);
+				}else{
+					func.reinit_aggregates((*flush_pos).first, (*flush_pos).second);
+					++flush_pos;
+				}
+			}
+		}
+
+		return 0;
+	}
+
+	virtual int set_param_block(int sz, void * value) {
+		func.set_param_block(sz, value);
+		return 0;
+	}
+
+	virtual int get_temp_status(host_tuple& result) {
+		result.channel = output_channel;
+		return func.create_temp_status_tuple(result, true);
+	}
+
+	virtual int get_blocked_status () {
+		return -1;
+	}
+
+	unsigned int get_mem_footprint() {
+		return group_table.get_mem_footprint();
+	}
+};
+
+#endif	// GROUPBY_OPERATOR_H