McxClientApp Data Logger

This section will show a simple example of the McxClientApp template used for data logging

13 minute read

This example will demonstrate how to create a simple client application using the McxClientApp template for data logging purposes. The application will connect to a Motorcortex server, subscribe to specific parameters, and log the received data to a CSV file.

It is a bare example where many additional features such as, for example, trigger logging from the GUI or automatically splitting to new csvs when they get too big, are left as an exercise for the reader to implement and can be created with basic Python knowledge.

Code

With a subscriber thread running in the background to receive data from the server, the main application loop will periodically writing the queue of data to a CSV file. We will go over the code in steps below but you can also go through the complete code yourself.

Show the full code

The code can also be found in the example folder of the mcx-client-app-template repository under examples/datalogger.py.

import sys
from pathlib import Path

# Add parent directory to path to import mcx_client_app
sys.path.insert(0, str(Path(__file__).parent.parent))

from src.mcx_client_app import McxClientApp, McxClientAppOptions, ThreadSafeValue
from motorcortex import Subscription
import os
import csv
from datetime import datetime # For timestamping files
from queue import Queue # Thread-safe queue
import time
import logging


def timespec_to_msec(timestamp):
    return timestamp.sec * 1000 + timestamp.nsec / 1000000
    
class dataLoggerClientApp(McxClientApp):
    """
    Application that implements thread-safe data logging with subscriptions.
    Data is collected from subscription callbacks and saved to CSV in the action thread.
    """
    def __init__(self, options: McxClientAppOptions, paths: list[str], file_path: str, divider: int = 10, save_interval: int = 10, batch_size: int = 100):
        """Initialize the data logger client app.
        
        Args:
            options (McxClientAppOptions): Options for the MCX client app.
            paths (list[str]): List of parameter paths to log.
            file_path (str): Path to the file where data will be logged.
            divider (int, optional): Frequency divider for logging. Defaults to 10.
            save_interval (int, optional): Interval for saving data to file in seconds. Defaults to 10.
            batch_size (int, optional): Maximum items to process per iteration. Defaults to 100.
        """
        super().__init__(options)
        self.__subscription: Subscription = None # Placeholder for subscription
        self.__paths = paths # List of parameter paths to log
        self.__file_path = file_path # Path to the file where data will be logged
        self.__divider = divider # Frequency divider for logging
        self.__save_interval = save_interval # Optional: Interval for saving data to file in seconds
        self.__batch_size = batch_size # Maximum items to process per iteration
        self.__data_queue: Queue = Queue()  # Unbounded thread-safe queue
        self.__buffer: list[dict] = []  # Buffer to accumulate data before writing
        self.__last_save_time: float = time.time() # Last time data was saved
        self.__field_mapping: dict = {}  # Maps path to expanded field names
        self.__fieldnames: list[str] = []  # All CSV column names
        
    def startOp(self) -> None:
        """Start the data logging operation by subscribing to parameters."""
        logging.info(f"Subscribing to {len(self.__paths)} parameters...")
        self.__subscription = self.sub.subscribe(
            self.__paths, 
            "DataLoggerGroup", 
            frq_divider=self.__divider
        )
        self.__subscription.notify(self.__sub_callback)
        
        # Initialize CSV file with headers
        self.__initialize_csv()
        logging.info("Data logger initialized and subscribed.")
        
    def __get_unique_filepath(self) -> str:
        """Get a unique filepath by appending date and time.
        
        Returns:
            str: Unique filepath (e.g., robot_data_2024-12-12_14-30-45.csv)
        """
        # Split path into directory, name, and extension
        directory = os.path.dirname(self.__file_path)
        basename = os.path.basename(self.__file_path)
        name, ext = os.path.splitext(basename)
        
        # Append current date and time
        timestamp = datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
        new_filepath = os.path.join(directory, f"{name}_{timestamp}{ext}")
        
        return new_filepath
    
    def __initialize_csv(self) -> None:
        """Initialize the CSV file with headers."""
        # Get unique filepath if file already exists
        self.__file_path = self.__get_unique_filepath()
        
        # Ensure directory exists
        os.makedirs(os.path.dirname(self.__file_path), exist_ok=True)
        
        # Get parameter tree to determine array sizes
        tree = self.parameter_tree.getParameterTree()
        
        # Build expanded fieldnames for arrays/matrices
        expanded_fieldnames = ['timestamp']
        self.__field_mapping = {}  # Maps original path to list of expanded field names
        
        for path in self.__paths:
            # Find parameter info in tree
            param_info = None
            for param in tree:
                if param.path == path:
                    param_info = param
                    break
            
            if param_info and param_info.number_of_elements > 1:
                # Array/matrix - expand into multiple columns
                field_list = []
                for i in range(param_info.number_of_elements):
                    field_name = f"{path}[{i}]"
                    expanded_fieldnames.append(field_name)
                    field_list.append(field_name)
                self.__field_mapping[path] = field_list
            else:
                # Scalar - single column
                expanded_fieldnames.append(path)
                self.__field_mapping[path] = [path]
        
        self.__fieldnames = expanded_fieldnames
        
        # Write header row
        with open(self.__file_path, 'w', newline='') as csvfile:
            writer = csv.DictWriter(csvfile, fieldnames=self.__fieldnames)
            writer.writeheader()
        logging.info(f"CSV file initialized: {self.__file_path}")
        logging.info(f"Field mapping: {self.__field_mapping}")
        
    def __sub_callback(self, msg) -> None:
        """Callback for subscription updates (runs in subscription thread).
        
        Args:
            msg: Message containing updated parameter values.
        """
        # Collect all values from this message with timestamp
        data_row = {'timestamp': timespec_to_msec(msg[0].timestamp)}
        
        for item, param in enumerate(msg):
            path = self.__paths[item]
            value = param.value
            
            # Get the field names for this path
            field_names = self.__field_mapping.get(path, [path])
            
            if len(field_names) == 1:
                # Scalar value
                data_row[field_names[0]] = value[0] if isinstance(value, (list, tuple)) and len(value) > 0 else value
            else:
                # Array/matrix - split into individual columns
                for i, field_name in enumerate(field_names):
                    data_row[field_name] = value[i] if i < len(value) else None
        
        # Put data in thread-safe queue (unbounded, no blocking)
        self.__data_queue.put(data_row)
            
    def __save_data(self) -> None:
        """Save buffered data to CSV file."""
        if not self.__buffer:
            return
            
        try:
            with open(self.__file_path, 'a', newline='') as csvfile:
                writer = csv.DictWriter(csvfile, fieldnames=self.__fieldnames)
                writer.writerows(self.__buffer)
            
            logging.info(f"Saved {len(self.__buffer)} rows to {self.__file_path}")
            self.__buffer.clear()
            self.__last_save_time = time.time()
        except Exception as e:
            logging.error(f"Error saving data: {e}")
                
    def action(self) -> None:
        """Perform the data logging action (runs in action thread).
        
        Retrieves data from the queue in batches and saves it periodically to CSV.
        """
        # Process up to batch_size items from queue
        processed = 0
        
        while processed < self.__batch_size and not self.__data_queue.empty():
            data_row = self.__data_queue.get()
            self.__buffer.append(data_row)
            processed += 1
        
        # Check if it's time to save to file
        current_time = time.time()
        should_save = (current_time - self.__last_save_time >= self.__save_interval) or len(self.__buffer) >= 1000
        
        if should_save:
            self.__save_data()
    
    def onExit(self) -> None:
        """Cleanup: save any remaining buffered data before exit."""
        logging.info("Saving remaining data before exit...")
        
        # Check if it's time to save to file
        current_time = time.time()
        should_save = (current_time - self.__last_save_time >= self.__save_interval) or len(self.__buffer) >= 1000
        
        if should_save:
            self.__save_data()
        
        # Small sleep to prevent busy waiting and block the stop signal
        self.wait(0.1, block_stop_signal=True)
        
        remaining = 0
        while not self.__data_queue.empty():
            data_row = self.__data_queue.get()
            self.__buffer.append(data_row)
            remaining += 1
            
            if len(self.__buffer) >= self.__batch_size:
                self.__save_data()
        
        if remaining > 0:
            logging.info(f"Processing {remaining} remaining samples from queue...")
        
        # Save final buffer
        self.__save_data()
        logging.info("Data logger cleanup complete.")
        
if __name__ == "__main__":
    options = McxClientAppOptions(
        login="",
        password="",
        target_url=""
    )
    
    # Example parameters to log
    paths_to_log = [
        "root/ManipulatorControl/jointPositionsTarget",
        "root/ManipulatorControl/jointPositionsActual",
    ]
    
    # Log file path
    log_file = "./data/robot_data.csv"
    
    app = dataLoggerClientApp(
        options=options,
        paths=paths_to_log,
        file_path=log_file,
        divider=10,  # Log every 10th message
        batch_size=100,  # Process max 100 items per iteration
        save_interval=3  # Save to file every 10 seconds
    )
    app.run()

1. Import necessary modules and set up the class

Firstly, we import the required modules and define our dataLoggerClientApp class that inherits from McxClientApp. This class will handle the subscription to parameters and logging of data. We will use the startOp, action, and onExit methods to manage the lifecycle of our application.

import sys
from pathlib import Path

# Add parent directory to path to import mcx_client_app
sys.path.insert(0, str(Path(__file__).parent.parent))

from src.mcx_client_app import McxClientApp, McxClientAppOptions, ThreadSafeValue
from motorcortex import Subscription
import os
import csv
from datetime import datetime # For timestamping files
from queue import Queue # Thread-safe queue
import time
import logging
    
class dataLoggerClientApp(McxClientApp):
    """
    Application that implements thread-safe data logging with subscriptions.
    Data is collected from subscription callbacks and saved to CSV in the action thread.
    """
    def __init__(self, options: McxClientAppOptions, paths: list[str], file_path: str, divider: int = 10, save_interval: int = 10, batch_size: int = 100):
        """Initialize the data logger client app.
        
        Args:
            options (McxClientAppOptions): Options for the MCX client app.
            paths (list[str]): List of parameter paths to log.
            file_path (str): Path to the file where data will be logged.
            divider (int, optional): Frequency divider for logging. Defaults to 10.
            save_interval (int, optional): Interval for saving data to file in seconds. Defaults to 10.
            batch_size (int, optional): Maximum items to process per iteration. Defaults to 100.
        """
        super().__init__(options)
        self.__paths = paths # List of parameter paths to log
        self.__file_path = file_path # Path to the file where data will be logged
        self.__divider = divider # Frequency divider for logging
        self.__save_interval = save_interval # Optional: Interval for saving data to file in seconds
        self.__batch_size = batch_size # Maximum items to process per iteration
        
    def startOp(self) -> None:
        """Start the data logging operation by subscribing to parameters."""
        pass
                
    def action(self) -> None:
        """Perform the data logging action (runs in action thread).
        
        Retrieves data from the queue in batches and saves it periodically to CSV.
        """
        pass
    
    def onExit(self) -> None:
        """Cleanup: save any remaining buffered data before exit."""
        pass

The dataLoggerClientApp class initialises with the necessary parameters for the base class McxClientApp, as well as the list of parameter paths to log, the file path for logging, and optional parameters for frequency division, save interval, and batch size.

2. Implement the subscription and data handling

In the startOp method, we subscribe to the specified parameters and set up a callback function to handle incoming data. The callback function will store the received data in a thread-safe queue for later processing. Do not forget to add initialise the variables in the __init__ method as shown in the complete code below.

def timespec_to_msec(timestamp):
    return timestamp.sec * 1000 + timestamp.nsec / 1000000

def __init__(self, options: McxClientAppOptions, paths: list[str], file_path: str, divider: int = 10, save_interval: int = 10, batch_size: int = 100):
    # Previous initialization code...
    self.__subscription: Subscription = None # Placeholder for subscription
    self.__data_queue: Queue = Queue()  # Unbounded thread-safe queue
    self.__field_mapping = {}  # Maps path to expanded field names

def startOp(self) -> None: # Overwrite the startOp method
    """Start the data logging operation by subscribing to parameters."""
    logging.info(f"Subscribing to {len(self.__paths)} parameters...")
    self.__subscription = self.sub.subscribe(
        self.__paths, 
        "DataLoggerGroup", 
        frq_divider=self.__divider
    )
    self.__subscription.notify(self.__sub_callback)


def __sub_callback(self, msg) -> None: # This is the subscription callback and also part of the class
    """Callback for subscription updates (runs in subscription thread).
    
    Args:
        msg: Message containing updated parameter values.
    """
    # Collect all values from this message with timestamp
    data_row = {'timestamp': timespec_to_msec(msg[0].timestamp)}
    
    for item, param in enumerate(msg):
        path = self.__paths[item]
        value = param.value
        
        # Get the field names for this path
        field_names = self.__field_mapping.get(path, [path])
        
        if len(field_names) == 1:
            # Scalar value
            data_row[field_names[0]] = value[0] if isinstance(value, (list, tuple)) and len(value) > 0 else value
        else:
            # Array/matrix - split into individual columns
            for i, field_name in enumerate(field_names):
                data_row[field_name] = value[i] if i < len(value) else None
    
    # Put data in thread-safe queue (unbounded, no blocking)
    self.__data_queue.put(data_row)

The self.__fieldmapping dictionary is used to map parameter paths to their corresponding expanded field names in the CSV file, especially for array or matrix parameters. This will be populated in the CSV initialization step.

The helper function timespec_to_msec converts the timestamp from the Motorcortex timespec format to milliseconds for easier logging.

3. Initialize the CSV file

We need to create a method to initialize the CSV file with appropriate headers based on the parameters being logged.

def __initialize_csv(self) -> None:
    """Initialize the CSV file with headers."""
    # Get unique filepath if file already exists
    self.__file_path = self.__get_unique_filepath()
    
    # Ensure directory exists
    os.makedirs(os.path.dirname(self.__file_path), exist_ok=True)
    
    # Get parameter tree to determine array sizes
    tree = self.parameter_tree.getParameterTree()
    
    # Build expanded fieldnames for arrays/matrices
    expanded_fieldnames = ['timestamp']
    self.__field_mapping = {}  # Maps original path to list of expanded field names
    
    for path in self.__paths:
        # Find parameter info in tree
        param_info = None
        for param in tree:
            if param.path == path:
                param_info = param
                break
        
        if param_info and param_info.number_of_elements > 1:
            # Array/matrix - expand into multiple columns
            field_list = []
            for i in range(param_info.number_of_elements):
                field_name = f"{path}[{i}]"
                expanded_fieldnames.append(field_name)
                field_list.append(field_name)
            self.__field_mapping[path] = field_list
        else:
            # Scalar - single column
            expanded_fieldnames.append(path)
            self.__field_mapping[path] = [path]
    
    self.__fieldnames = expanded_fieldnames
    
    # Write header row
    with open(self.__file_path, 'w', newline='') as csvfile:
        writer = csv.DictWriter(csvfile, fieldnames=self.__fieldnames)
        writer.writeheader()
    logging.info(f"CSV file initialized: {self.__file_path}")
    logging.info(f"Field mapping: {self.__field_mapping}")

This method creates the CSV file and writes the header row based on the parameters being logged. It also handles expanding array or matrix parameters into multiple columns. It relies on a helper method __get_unique_filepath to avoid overwriting existing files.

def __get_unique_filepath(self) -> str:
    """Get a unique filepath by appending date and time.
    
    Returns:
        str: Unique filepath (e.g., robot_data_2024-12-12_14-30-45.csv)
    """
    # Split path into directory, name, and extension
    directory = os.path.dirname(self.__file_path)
    basename = os.path.basename(self.__file_path)
    name, ext = os.path.splitext(basename)
    
    # Append current date and time
    timestamp = datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
    new_filepath = os.path.join(directory, f"{name}_{timestamp}{ext}")
    
    return new_filepath

Again, do not forget to initialise the variables in the __init__ method and call the __initialize_csv method in the startOp method.

def __init__(self, options: McxClientAppOptions, paths: list[str], file_path: str, divider: int = 10, save_interval: int = 10, batch_size: int = 100):
    # Previous initialization code...
    self.__fieldnames: list[str] = []  # All CSV column names

def startOp(self) -> None: # Overwrite the startOp method
    # Previous startOp code...

    # Initialize CSV file with headers
    self.__initialize_csv()
    logging.info("Data logger initialized and subscribed.")

4. Implement the action method for data saving

Now that the subscriber puts the data in a thread-safe queue, we need to implement the action method to periodically save this data to the CSV file.

def __init__(self, options: McxClientAppOptions, paths: list[str], file_path: str, divider: int = 10, save_interval: int = 10, batch_size: int = 100):
    # Previous initialization code...
    self.__buffer: list[dict] = []  # Buffer to accumulate data before writing
    self.__last_save_time: float = time.time() # Time of last save

def __save_data(self) -> None:
    """Save buffered data to CSV file."""
    if not self.__buffer:
        return
        
    try:
        with open(self.__file_path, 'a', newline='') as csvfile:
            writer = csv.DictWriter(csvfile, fieldnames=self.__fieldnames)
            writer.writerows(self.__buffer)
        
        logging.info(f"Saved {len(self.__buffer)} rows to {self.__file_path}")
        self.__buffer.clear()
        self.__last_save_time = time.time()
    except Exception as e:
        logging.error(f"Error saving data: {e}")
            
def action(self) -> None:
    """Perform the data logging action (runs in action thread).
    
    Retrieves data from the queue in batches and saves it periodically to CSV.
    """
    # Process up to batch_size items from queue
    processed = 0
    
    while processed < self.__batch_size and not self.__data_queue.empty():
        data_row = self.__data_queue.get()
        self.__buffer.append(data_row)
        processed += 1
    
    # Check if it's time to save to file
    current_time = time.time()
    should_save = (current_time - self.__last_save_time >= self.__save_interval) or len(self.__buffer) >= 1000
    
    if should_save:
        self.__save_data()

The action method processes data from the queue in batches and saves it to the CSV file either when a certain time interval has passed or when the buffer reaches a certain size. The time interval is important in the case that the subscriber adds data faster to the queue than the action method can process it. If no interval is used, the buffer may never get saved if the queue is constantly filled. The __save_data method handles the actual writing to the CSV file.

5. Implement the cleanup in onExit

Finally, we need to ensure that any remaining data in the queue is saved when the application is exiting. This is done in the onExit method.

def onExit(self) -> None:
    """Cleanup: save any remaining buffered data before exit."""
    logging.info("Saving remaining data before exit...")
    
    # Check if it's time to save to file
    current_time = time.time()
    should_save = (current_time - self.__last_save_time >= self.__save_interval) or len(self.__buffer) >= 1000
    
    if should_save:
        self.__save_data()
    
    # Small sleep to prevent busy waiting and block the stop signal
    self.wait(0.1, block_stop_signal=True)
    
    remaining = 0
    while not self.__data_queue.empty():
        data_row = self.__data_queue.get()
        self.__buffer.append(data_row)
        remaining += 1
        
        if len(self.__buffer) >= self.__batch_size:
            self.__save_data()
    
    if remaining > 0:
        logging.info(f"Processing {remaining} remaining samples from queue...")
    
    # Save final buffer
    self.__save_data()
    logging.info("Data logger cleanup complete.")

6. Running the application

Finally, we can create an instance of our dataLoggerClientApp and run it. We need to provide the necessary options, paths to log, and the file path for logging.

if __name__ == "__main__":
    options = McxClientAppOptions(
        login="",
        password="",
        target_url=""
    )
    
    # Example parameters to log
    paths_to_log = [
        "root/ManipulatorControl/jointPositionsTarget",
        "root/ManipulatorControl/jointPositionsActual",
    ]
    
    # Log file path
    log_file = "./data/robot_data.csv"
    
    app = dataLoggerClientApp(
        options=options,
        paths=paths_to_log,
        file_path=log_file,
        divider=10,  # Log every 10th message
        batch_size=100,  # Process max 100 items per iteration
        save_interval=3  # Save to file every 10 seconds
    )
    app.run()