From: rajdeep11
Date: Wed, 19 Feb 2025 05:42:49 +0000 (+0530)
Subject: pipeline code placed in the samples folder
X-Git-Url: https://gerrit.o-ran-sc.org/r/gitweb?a=commitdiff_plain;h=84fb406bb38393775cea4592ef772b9ed2571d28;p=aiml-fw%2Faimlfw-dep.git

pipeline code placed in the samples folder

Change-Id: I5db915e280616efab9a34568ed5aeb57a644b277
Signed-off-by: rajdeep11
---

diff --git a/samples/qoe/qoe_pipeline_k_release.py b/samples/qoe/qoe_pipeline_k_release.py
new file mode 100644
index 0000000..5f8fc6d
--- /dev/null
+++ b/samples/qoe/qoe_pipeline_k_release.py
@@ -0,0 +1,132 @@
+# ==================================================================================
+#
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# ==================================================================================
+
+import kfp
+import kfp.dsl as dsl
+from kfp.dsl import component
+from kfp import kubernetes
+
+BASE_IMAGE = "traininghost/pipelineimage:latest"
+
+# 'requests' is imported inside the component, so install it explicitly here
+# as well (the retraining sample already does this).
+@component(base_image=BASE_IMAGE, packages_to_install=['requests'])
+def train_export_model(featurepath: str, epochs: str, modelname: str, modelversion: str):
+
+    import tensorflow as tf
+    import numpy as np
+    import pandas as pd
+    import requests
+    from tensorflow.keras.models import Sequential
+    from tensorflow.keras.layers import Dense, LSTM
+    from featurestoresdk.feature_store_sdk import FeatureStoreSdk
+    from modelmetricsdk.model_metrics_sdk import ModelMetricsSdk
+
+    print("numpy version:", np.__version__)
+
+    fs_sdk = FeatureStoreSdk()
+    mm_sdk = ModelMetricsSdk()
+
+    print("featurepath is: ", featurepath)
+    features = fs_sdk.get_features(featurepath, ['pdcpBytesDl', 'pdcpBytesUl'])
+    print("Dataframe:")
+    print(features)
+
+    features_cellc2b2 = features
+    print('Previous data types are --> ', features_cellc2b2.dtypes)
+    # The counters may arrive as strings; cast both columns to float32.
+    features_cellc2b2["pdcpBytesDl"] = pd.to_numeric(features_cellc2b2["pdcpBytesDl"], downcast="float")
+    features_cellc2b2["pdcpBytesUl"] = pd.to_numeric(features_cellc2b2["pdcpBytesUl"], downcast="float")
+    print('New data types are --> ', features_cellc2b2.dtypes)
+
+    features_cellc2b2 = features_cellc2b2[['pdcpBytesDl', 'pdcpBytesUl']]
+
+    # Slide a window over the series: each sample pairs n_past consecutive
+    # rows (X) with the following n_future rows (y).
+    def split_series(series, n_past, n_future):
+        X, y = list(), list()
+        for window_start in range(len(series)):
+            past_end = window_start + n_past
+            future_end = past_end + n_future
+            if future_end > len(series):
+                break
+            past, future = series[window_start:past_end, :], series[past_end:future_end, :]
+            X.append(past)
+            y.append(future)
+        return np.array(X), np.array(y)
+
+    X, y = split_series(features_cellc2b2.values, 10, 1)
+    y = y.reshape((y.shape[0], y.shape[2]))
+    print(X.shape)
+    print(y.shape)
+
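+    # The forecaster below maps a window of 10 past timesteps x 2 features
+    # (pdcpBytesDl, pdcpBytesUl) to the next timestep's 2 values: three
+    # stacked LSTM layers followed by a Dense output layer, trained on MSE.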
+    model = Sequential()
+    model.add(LSTM(units=150, activation="tanh", return_sequences=True, input_shape=(X.shape[1], X.shape[2])))
+    model.add(LSTM(units=150, activation="tanh", return_sequences=True))
+    model.add(LSTM(units=150, activation="tanh", return_sequences=False))
+    model.add(Dense(units=X.shape[2]))
+
+    model.compile(loss='mse', optimizer='adam', metrics=['mse'])
+    model.summary()
+
+    model.fit(X, y, batch_size=10, epochs=int(epochs), validation_split=0.2)
+    yhat = model.predict(X, verbose=0)
+
+    model.save("./")
+
+    # Report the fraction of predictions within 5 of the actual value as the
+    # "Accuracy" metric.
+    data = {}
+    data['metrics'] = []
+    data['metrics'].append({'Accuracy': str(np.mean(np.absolute(np.asarray(y) - np.asarray(yhat)) < 5))})
+
+    # The artifact version of a freshly trained model is always 1.0.0;
+    # register it with the model management service before uploading.
+    artifactversion = "1.0.0"
+    url = f"http://modelmgmtservice.traininghost:8082/ai-ml-model-registration/v1/model-registrations/updateArtifact/{modelname}/{modelversion}/{artifactversion}"
+    updated_model_info = requests.post(url).json()
+    print(updated_model_info)
+
+    mm_sdk.upload_metrics(data, modelname, modelversion, artifactversion)
+    mm_sdk.upload_model("./", modelname, modelversion, artifactversion)
+
+@dsl.pipeline(
+    name="qoe Pipeline",
+    description="qoe",
+)
+def super_model_pipeline(
+        featurepath: str, epochs: str, modelname: str, modelversion: str):
+
+    trainop = train_export_model(featurepath=featurepath, epochs=epochs, modelname=modelname, modelversion=modelversion)
+    trainop.set_caching_options(False)
+    kubernetes.set_image_pull_policy(trainop, "IfNotPresent")
+
+pipeline_func = super_model_pipeline
+file_name = "qoe_model_pipeline"
+
+kfp.compiler.Compiler().compile(pipeline_func, '{}.yaml'.format(file_name))
+
+# Upload the compiled pipeline to the training manager.
+import requests
+pipeline_name = "qoe_Pipeline"
+pipeline_file = file_name + '.yaml'
+with open(pipeline_file, 'rb') as f:
+    requests.post("http://tm.traininghost:32002/pipelines/{}/upload".format(pipeline_name), files={'file': f})
diff --git a/samples/qoe/qoe_pipeline_retraining_k_release.py b/samples/qoe/qoe_pipeline_retraining_k_release.py
new file mode 100644
index 0000000..fbe29a5
--- /dev/null
+++ b/samples/qoe/qoe_pipeline_retraining_k_release.py
@@ -0,0 +1,218 @@
+# ==================================================================================
+#
+# Copyright (c) 2025 Samsung Electronics Co., Ltd. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# ==================================================================================
+
+import kfp
+import kfp.dsl as dsl
+from kfp.dsl import component
+from kfp import kubernetes
+
+BASE_IMAGE = "traininghost/pipelineimage:latest"
+
+@component(base_image=BASE_IMAGE, packages_to_install=['requests'])
+def train_export_model(featurepath: str, epochs: str, modelname: str, modelversion: str):
+
+    import os
+    import zipfile
+    import tensorflow as tf
+    import numpy as np
+    import pandas as pd
+    import requests
+    from featurestoresdk.feature_store_sdk import FeatureStoreSdk
+    from modelmetricsdk.model_metrics_sdk import ModelMetricsSdk
+
+    print("numpy version:", np.__version__)
+
+    fs_sdk = FeatureStoreSdk()
+    mm_sdk = ModelMetricsSdk()
+
+    print("featurepath is: ", featurepath)
+    features = fs_sdk.get_features(featurepath, ['pdcpBytesDl', 'pdcpBytesUl'])
+    print("Dataframe:")
+    print(features)
+
+    features_cellc2b2 = features
+    print('Previous data types are --> ', features_cellc2b2.dtypes)
+    # The counters may arrive as strings; cast both columns to float32.
+    features_cellc2b2["pdcpBytesDl"] = pd.to_numeric(features_cellc2b2["pdcpBytesDl"], downcast="float")
+    features_cellc2b2["pdcpBytesUl"] = pd.to_numeric(features_cellc2b2["pdcpBytesUl"], downcast="float")
+    print('New data types are --> ', features_cellc2b2.dtypes)
+
+    features_cellc2b2 = features_cellc2b2[['pdcpBytesDl', 'pdcpBytesUl']]
+
+    # Slide a window over the series: each sample pairs n_past consecutive
+    # rows (X) with the following n_future rows (y).
+    def split_series(series, n_past, n_future):
+        X, y = list(), list()
+        for window_start in range(len(series)):
+            past_end = window_start + n_past
+            future_end = past_end + n_future
+            if future_end > len(series):
+                break
+            past, future = series[window_start:past_end, :], series[past_end:future_end, :]
+            X.append(past)
+            y.append(future)
+        return np.array(X), np.array(y)
+
+    X, y = split_series(features_cellc2b2.values, 10, 1)
+    y = y.reshape((y.shape[0], y.shape[2]))
+    print(X.shape)
+    print(y.shape)
+
+    print("Loading the saved model")
+    print(os.listdir(os.getcwd()))
+
+    # Look up the current artifact for this model/version in the model
+    # management service; prefer its advertised location, falling back to the
+    # training manager's model download endpoint.
+    url = f"http://modelmgmtservice.traininghost:8082/ai-ml-model-discovery/v1/models/?model-name={modelname}&model-version={modelversion}"
+    modelinfo = requests.get(url).json()[0]
+    artifactversion = modelinfo["modelId"]["artifactVersion"]
+    if modelinfo["modelLocation"] != "":
+        model_url = modelinfo["modelLocation"]
+    else:
+        model_url = f"http://tm.traininghost:32002/model/{modelname}/{modelversion}/{artifactversion}/Model.zip"
+
+    # Download the model zip file
+    print(f"Downloading model from: {model_url}")
+    response = requests.get(model_url)
+    print("Response generated: " + str(response))
+
+    # Fail fast if the download was unsuccessful
+    if response.status_code == 200:
+        local_file_path = 'Model.zip'
+        with open(local_file_path, 'wb') as file:
+            file.write(response.content)
+        print(f'Downloaded file saved to {local_file_path}')
+    else:
+        raise RuntimeError(f'Failed to download the model from {model_url} (HTTP {response.status_code})')
+
+    print(os.listdir(os.getcwd()))
+
+    # Extract the zip file
+    zip_file_path = "./Model.zip"
+    extract_to_dir = "./Model"
+
+    os.makedirs(extract_to_dir, exist_ok=True)
+
+    with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:
+        zip_ref.extractall(extract_to_dir)
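+
+    # The archive is expected to unpack to ./Model/<modelversion>, holding a
+    # TensorFlow SavedModel that is reloaded and recompiled below.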
+
+    # Delete the zip file after extraction
+    if os.path.exists(zip_file_path):
+        os.remove(zip_file_path)
+        print(f'Deleted zip file: {zip_file_path}')
+    else:
+        print(f'Zip file not found: {zip_file_path}')
+
+    # Load the model in SavedModel format
+    model_path = f"./Model/{modelversion}"
+    model = tf.keras.models.load_model(model_path)
+
+    model.compile(loss='mse', optimizer='adam', metrics=['mse'])
+    model.summary()
+
+    # Define a directory to save checkpoints
+    checkpoint_dir = "./checkpoints"
+    os.makedirs(checkpoint_dir, exist_ok=True)
+
+    # Checkpoint callback: keeps only the best model seen so far; the
+    # checkpoint files themselves are not part of the final upload.
+    checkpoint_path = os.path.join(checkpoint_dir, "model_epoch_{epoch:02d}_val_loss_{val_loss:.2f}.h5")
+    checkpoint_callback = tf.keras.callbacks.ModelCheckpoint(
+        filepath=checkpoint_path,
+        monitor='val_loss',        # monitor validation loss (training loss also works)
+        save_best_only=True,       # save only the best model by validation loss
+        save_weights_only=False,   # save the entire model, not just the weights
+        mode='min',                # lower validation loss is better
+        verbose=0                  # set to 1 to log each new checkpoint
+    )
+
+    # Retrain the model with checkpointing
+    print("Retraining the model with checkpoints...")
+    history = model.fit(
+        X,
+        y,
+        batch_size=10,
+        epochs=int(epochs),
+        validation_split=0.2,
+        callbacks=[checkpoint_callback]
+    )
+
+    yhat = model.predict(X, verbose=0)
+
+    retrained_model_path = "./retrain"
+    os.makedirs(retrained_model_path, exist_ok=True)
+
+    # Save the retrained model
+    model.save(retrained_model_path)
+    print(f"Retrained model saved at {retrained_model_path}")
+
+    # Report the fraction of predictions within 5 of the actual value as the
+    # "Accuracy" metric.
+    data = {}
+    data['metrics'] = []
+    data['metrics'].append({'Accuracy': str(np.mean(np.absolute(np.asarray(y) - np.asarray(yhat)) < 5))})
+
+    # Bump the artifact version: a model fetched from an external location is
+    # registered as 1.1.0; otherwise the minor version is incremented.
+    if modelinfo["modelLocation"] != "":
+        new_artifactversion = "1.1.0"
+    else:
+        major, minor, patch = map(int, artifactversion.split('.'))
+        minor += 1
+        new_artifactversion = f"{major}.{minor}.{patch}"
+
+    # Register the new artifact version with the model management service
+    url = f"http://modelmgmtservice.traininghost:8082/ai-ml-model-registration/v1/model-registrations/updateArtifact/{modelname}/{modelversion}/{new_artifactversion}"
+    updated_model_info = requests.post(url).json()
+    print(updated_model_info)
+
+    mm_sdk.upload_metrics(data, modelname, modelversion, new_artifactversion)
+    mm_sdk.upload_model("./retrain/", modelname, modelversion, new_artifactversion)
+
+@dsl.pipeline(
+    name="qoe Pipeline",
+    description="qoe",
+)
+def super_model_pipeline(
+        featurepath: str, epochs: str, modelname: str, modelversion: str):
+
+    trainop = train_export_model(featurepath=featurepath, epochs=epochs, modelname=modelname, modelversion=modelversion)
+    trainop.set_caching_options(False)
+    kubernetes.set_image_pull_policy(trainop, "IfNotPresent")
+
+pipeline_func = super_model_pipeline
+file_name = "qoe_model_pipeline_retrain"
+
+kfp.compiler.Compiler().compile(pipeline_func, '{}.yaml'.format(file_name))
+
+# Upload the compiled pipeline to the training manager.
+import requests
+pipeline_name = "qoe_Pipeline_retrain"
+pipeline_file = file_name + '.yaml'
+with open(pipeline_file, 'rb') as f:
+    requests.post("http://tm.traininghost:32002/pipelines/{}/upload".format(pipeline_name), files={'file': f})
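
Note: both samples compile their pipeline to YAML and upload it to the training manager as a side effect of being run, so they need network access to the in-cluster service names (tm.traininghost, modelmgmtservice.traininghost). As a minimal sketch of the model-discovery response element the retraining component consumes (only the two fields it actually reads are shown; the values are illustrative):

    modelinfo = {
        "modelId": {"artifactVersion": "1.0.0"},  # version of the artifact to retrain
        "modelLocation": ""                       # empty -> fetch Model.zip from tm.traininghost
    }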