update service data

script to optimize pytorch model on server
2023-04-18 17:13:15 +08:00 · 2023-04-18 17:13:05 +08:00
3 changed files with 145 additions and 0 deletions
--- a/optimize_model.py
+++ b/optimize_model.py
@ -0,0 +1,47 @@
 # optimize_model.py
 #
 # author: deng
 # date  : 20230418
 import shutil
 from pathlib import Path
 import torch
 import mlflow
 def optimize_pytorch_model(run_id: str) -> None:
    """Optimize Pytorch model on MLflow server, the optimized model will be sent back
    Args:
        run_id (str): mlflow run id
    """
    download_path = Path('./model/downloaded_pytorch_model')
    if download_path.is_dir():
        print(f'Remove existed dir: {download_path}')
        shutil.rmtree(download_path)
    # Download Pytorch model to local file system
    mlflow_model = mlflow.pytorch.load_model(f'runs:/{run_id}/model')
    mlflow.pytorch.save_model(mlflow_model, download_path)
    # Optimize model
    model = torch.load(download_path.joinpath('data/model.pth'))
    dummy_input = torch.randn(5)
    torch.onnx.export(model, dummy_input, download_path.joinpath('data/model.onnx'))
    # we can not call TensorRT on macOS, so imagine we get a serialized model
    download_path.joinpath('data/model.trt').touch()
    # Save optimized model to given run
    with mlflow.start_run(run_id=run_id):
        mlflow.log_artifact(download_path.joinpath('data/model.trt'), 'model/data')
        print(f'Optimized model had been uploaded to server: {mlflow.get_tracking_uri()}')
 if __name__ == '__main__':
    mlflow.set_tracking_uri('http://127.0.0.1:5001')
    optimize_pytorch_model(
        run_id='f1b7b9a5ba934f158c07975a8a332de5'
    )
--- a/service/artifacts/3/f1b7b9a5ba934f158c07975a8a332de5/artifacts/code/train.py
+++ b/service/artifacts/3/f1b7b9a5ba934f158c07975a8a332de5/artifacts/code/train.py
@ -0,0 +1,98 @@
 # train.py
 #
 # author: deng
 # date  : 20230221
 import torch
 import torch.nn as nn
 from torch.optim import SGD
 import mlflow
 from mlflow.models.signature import ModelSignature
 from mlflow.types.schema import Schema, ColSpec
 from tqdm import tqdm
 class Net(nn.Module):
    """ define a simple neural network model """
    def __init__(self):
        super(Net, self).__init__()
        self.fc1 = nn.Linear(5, 3)
        self.fc2 = nn.Linear(3, 1)
    def forward(self, x):
        x = self.fc1(x)
        x = torch.relu(x)
        x = self.fc2(x)
        return x
 def train(model, dataloader, criterion, optimizer, epochs):
    """ define the training function """
    for epoch in tqdm(range(epochs), 'Epochs'):
        for batch, (inputs, labels) in enumerate(dataloader):
            # forwarding
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            # update gradient
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()
        # log loss
        mlflow.log_metric('train_loss', loss.item(), step=epoch)
    return loss
 if __name__ == '__main__':
    # set hyper parameters
    learning_rate = 1e-2
    batch_size = 10
    epochs = 20
    # create a dataloader with fake data
    dataloader = [(torch.randn(5), torch.randn(1)) for _ in range(100)]
    dataloader = torch.utils.data.DataLoader(dataloader, batch_size=batch_size)
    # create the model, criterion, and optimizer
    model = Net()
    criterion = nn.MSELoss()
    optimizer = SGD(model.parameters(), lr=learning_rate)
    # set the tracking URI to the model registry
    mlflow.set_tracking_uri('http://127.0.0.1:5001')
    mlflow.set_experiment('train_fortune_predict_model')
    # start a new MLflow run
    with mlflow.start_run():
        # train the model
        loss = train(model, dataloader, criterion, optimizer, epochs)
        # log some additional metrics
        mlflow.log_metric('final_loss', loss.item())
        mlflow.log_param('learning_rate', learning_rate)
        mlflow.log_param('batch_size', batch_size)
        # create a signature to record model input and output info
        input_schema = Schema([
            ColSpec('float', 'age'),
            ColSpec('float', 'mood level'),
            ColSpec('float', 'health level'),
            ColSpec('float', 'hungry level'),
            ColSpec('float', 'sexy level')
        ])
        output_schema = Schema([ColSpec('float', 'fortune')])
        signature = ModelSignature(inputs=input_schema, outputs=output_schema)
        # log trained model
        mlflow.pytorch.log_model(model, 'model', signature=signature)
        # log training code
        mlflow.log_artifact('./train.py', 'code')
    print('Completed.')
--- a/service/backend.db
+++ b/service/backend.db
Author	SHA1	Message	Date
deng	e1f143736e	update service data	2023-04-18 17:13:15 +08:00
deng	3c39c48242	script to optimize pytorch model on server	2023-04-18 17:13:05 +08:00