cimp-impl/export_resnet_raw.py


								import torch

								import torch.nn as nn

								import os

								import argparse

								import sys

								from collections import OrderedDict


								# Make the directory that contains this script importable, so that the
								# `ltr` package expected to sit next to it can be imported below.
								# Note that the directory put on sys.path is the parent of `ltr`, not
								# `ltr` itself.

								workspace_root = os.path.abspath(os.path.join(os.path.dirname(__file__), '.'))

								print(f"Workspace root: {workspace_root}")

								ltr_path = os.path.join(workspace_root, 'ltr')

								# Abort early (exit code 1) when the `ltr` directory is not present.
								if not os.path.isdir(ltr_path):

								    print(f"Error: 'ltr' directory not found in {workspace_root}")

								    sys.exit(1)

								# Insert at position 0 so this workspace takes precedence over any other
								# entry already on sys.path.
								sys.path.insert(0, workspace_root)


								try:

								    # resnet50 is the model constructor taken from the ltr backbone
								    # package; it is imported here, at module load time.

								    from ltr.models.backbone.resnet import resnet50

								    print("Successfully imported ResNet from ltr.models.backbone.resnet")

								except ImportError as e:

								    print(f"Warning: Could not import ResNet from ltr.models.backbone.resnet: {e}")

								    # Only a warning is printed here: `resnet50` is left undefined when
								    # the import fails, so any later use of it must account for that.


								class TensorContainer(nn.Module):
								    """Minimal module whose only job is to carry one tensor.

								    The tensor is exposed as an attribute whose name is chosen by the
								    caller (``"tensor"`` by default), so that the module can be scripted
								    and saved as a self-contained file holding that single value.

								    Args:
								        tensor_to_wrap: The value to store on the module.
								        tensor_name: Attribute name under which the value is stored.
								    """

								    def __init__(self, tensor_to_wrap, tensor_name="tensor"):
								        super(TensorContainer, self).__init__()
								        # The attribute name is only known at runtime, so the value is
								        # attached through the generic attribute-setting hook instead of
								        # register_buffer / register_parameter.
								        self.__setattr__(tensor_name, tensor_to_wrap)


								def convert_param_name_to_filename(param_name):
								    """Map a dotted state-dict key to its underscore-style file name.

								    Every ``.`` in ``param_name`` becomes ``_`` and the ``.pt`` suffix is
								    appended, e.g. ``layer1.0.conv1.weight`` -> ``layer1_0_conv1_weight.pt``.
								    """
								    stem = "_".join(param_name.split("."))
								    return stem + ".pt"


								def _unwrap_script_module_tensor(script_module, filepath, kind):
								    """Return the single tensor carried by a loaded TorchScript module.

								    Lookup order: an attribute named ``tensor`` first; otherwise the
								    module's only buffer or only parameter.

								    Args:
								        script_module: The ``torch.jit.ScriptModule`` that was loaded.
								        filepath: Source file, used only in log and error messages.
								        kind: ``"param"`` or ``"buffer"``. For ``"param"`` a module with
								            exactly one parameter is accepted even if it also has buffers;
								            for ``"buffer"`` a lone parameter is accepted only when the
								            module has no buffers.

								    Raises:
								        ValueError: If no unambiguous tensor can be found.
								    """
								    try:
								        # In Python, scripted attributes are read with plain attribute
								        # access. `.attr(name).toTensor()` belongs to the C++ API; calling
								        # it here raised AttributeError and the fallback below never ran.
								        wrapped = getattr(script_module, "tensor")
								    except (AttributeError, RuntimeError):
								        wrapped = None
								    if isinstance(wrapped, torch.Tensor):
								        print(f"    INFO: Extracted tensor via .attr('tensor') from ScriptModule: {filepath}")
								        return wrapped

								    params = list(script_module.parameters())
								    buffers = list(script_module.buffers())
								    # The two conditions below are mutually exclusive (one needs exactly
								    # one parameter, the other needs none), so their order is irrelevant.
								    if len(buffers) == 1 and not params:
								        print(f"    INFO: Extracted tensor from single buffer of ScriptModule: {filepath}")
								        return buffers[0]
								    if len(params) == 1 and (kind == "param" or not buffers):
								        # Keeps the historical log wording of the two call sites.
								        noun = "parameter" if kind == "param" else "param"
								        print(f"    INFO: Extracted tensor from single {noun} of ScriptModule: {filepath}")
								        return params[0]
								    raise ValueError(f"ScriptModule at {filepath} doesn't have .attr('tensor') and not single param/buffer.")


								def _load_named_tensors(named_templates, source_dir, kind, state_dict):
								    """Load one file per ``(name, template)`` pair into ``state_dict``.

								    Args:
								        named_templates: Iterable of ``(name, tensor)`` pairs taken from
								            the model; each tensor supplies the expected shape.
								        source_dir: Directory holding the underscore-named ``.pt`` files.
								        kind: ``"param"`` or ``"buffer"``; used in messages and to select
								            the ScriptModule fallback rule.
								        state_dict: Mapping that receives every successfully loaded tensor.

								    Returns:
								        List of names that were not loaded (file missing, load error or
								        shape mismatch).
								    """
								    missed = []
								    for name, template in named_templates:
								        filepath = os.path.join(source_dir, convert_param_name_to_filename(name))
								        if not os.path.exists(filepath):
								            missed.append(name)
								            continue

								        try:
								            tensor_data = torch.load(filepath, map_location=torch.device('cpu'))
								            # The file may hold a scripted wrapper module rather than a
								            # bare tensor; unwrap it in that case.
								            if isinstance(tensor_data, torch.jit.ScriptModule):
								                tensor_data = _unwrap_script_module_tensor(tensor_data, filepath, kind)
								            if not isinstance(tensor_data, torch.Tensor):
								                raise TypeError(f"Loaded data from {filepath} is not a tensor (type: {type(tensor_data)})")
								        except Exception as e:
								            # Deliberately broad: loading is best-effort per file, one bad
								            # file must not abort the whole run. The failure is reported.
								            print(f"    ERROR loading or processing {filepath} for {kind} {name}: {e}. Skipping.")
								            missed.append(name)
								            continue

								        expected_shape = template.data.shape
								        if tensor_data.shape != expected_shape:
								            print(f"    WARNING: Shape mismatch for {kind} {name}. Expected {expected_shape}, got {tensor_data.shape} from {filepath}. Skipping.")
								            missed.append(name)
								            continue

								        state_dict[name] = tensor_data
								    return missed


								def load_weights_from_individual_files(model_to_populate, source_dir):
								    """Populate a model from a directory of per-tensor ``.pt`` files.

								    For every parameter and buffer of ``model_to_populate`` the file
								    ``<name with dots replaced by underscores>.pt`` is looked up in
								    ``source_dir``. Files may contain a bare tensor or a scripted module
								    wrapping one. Tensors whose shape matches the model are collected and
								    applied with ``load_state_dict(..., strict=False)``; a summary of what
								    was missing is printed afterwards.

								    Args:
								        model_to_populate: Module whose parameters/buffers are filled in place.
								        source_dir: Directory containing the source files.

								    Returns:
								        None. The model is modified in place.

								    Raises:
								        SystemExit: With code 1 when not a single tensor could be loaded.
								    """
								    print(f"Attempting to load weights from individual files in: {source_dir} using underscore naming convention.")

								    new_state_dict = OrderedDict()
								    missed_params = _load_named_tensors(
								        model_to_populate.named_parameters(), source_dir, "param", new_state_dict)
								    missed_buffers = _load_named_tensors(
								        model_to_populate.named_buffers(), source_dir, "buffer", new_state_dict)

								    # Parameter and buffer names never collide, so the dict size equals
								    # the number of successfully loaded tensors.
								    loaded_count = len(new_state_dict)
								    if loaded_count == 0:
								        print("ERROR: No weights were found or loaded from individual files. Aborting.")
								        sys.exit(1)

								    print(f"Attempting to load {loaded_count} found tensors into model state_dict.")
								    result = model_to_populate.load_state_dict(new_state_dict, strict=False)
								    print("State_dict loading result:")
								    if result.missing_keys:
								        print(f"  Strict load missing_keys ({len(result.missing_keys)}): {result.missing_keys[:20]}...") # Print first 20
								    if result.unexpected_keys:
								        print(f"  Strict load unexpected_keys ({len(result.unexpected_keys)}): {result.unexpected_keys[:20]}...")

								    # Cross check with our own missed lists
								    print(f"Manually tracked missed parameters ({len(missed_params)}): {missed_params[:20]}...")
								    print(f"Manually tracked missed buffers ({len(missed_buffers)}): {missed_buffers[:20]}...")

								    # Every key of the model's state_dict that did not come from a file.
								    truly_missing_from_model = set(model_to_populate.state_dict()) - set(new_state_dict)
								    if truly_missing_from_model:
								        print(f"CRITICAL: Keys in model NOT found in source_dir ({len(truly_missing_from_model)}): {list(truly_missing_from_model)[:20]}...")

								    if not truly_missing_from_model and not result.unexpected_keys:
								        print("Successfully loaded weights from individual files into the model.")
								    else:
								        print("WARNING: Some weights might be missing or unexpected after loading from individual files.")


								def export_jit_wrapped_tensors(model, output_dir):
								    """Write every parameter and buffer of ``model`` as its own scripted file.

								    Each tensor is copied to CPU, wrapped in a ``TensorContainer`` under
								    the attribute name ``"tensor"``, scripted, and saved to
								    ``<output_dir>/<dotted name>.pt``. Parameters are written first, then
								    buffers. ``output_dir`` is created when it does not exist yet.

								    Args:
								        model: Module whose named parameters and buffers are exported.
								        output_dir: Destination directory for the generated files.
								    """
								    # Attribute name inside the container; consumers read the tensor back
								    # under this key.
								    container_key = "tensor"

								    if not os.path.exists(output_dir):
								        os.makedirs(output_dir)
								        print(f"Created output directory: {output_dir}")

								    # (label used in the log line, accessor yielding (name, tensor) pairs)
								    sources = (
								        ("parameter", model.named_parameters),
								        ("buffer", model.named_buffers),
								    )
								    for label, iter_named in sources:
								        for name, tensor in iter_named():
								            filename = name + '.pt'
								            filepath = os.path.join(output_dir, filename)
								            print(f"Exporting JIT-wrapped {label}: {name} (as {filename}) to {filepath} with shape {tensor.data.shape}")
								            # Detached CPU copy so the saved file does not depend on the
								            # live model's storage or device.
								            payload = tensor.data.clone().detach().cpu()
								            wrapped = TensorContainer(payload, container_key)
								            torch.jit.save(torch.jit.script(wrapped), filepath)

								    print(f"All params/buffers exported as JIT-wrapped tensors to {output_dir} (using dot naming, key '{container_key}').")


								if __name__ == "__main__":
								    # Command-line entry point: build a ResNet-50, fill it from a directory
								    # of underscore-named per-tensor files, then re-export every tensor as
								    # a dot-named scripted container file.
								    parser = argparse.ArgumentParser(description="Load ResNet-50 weights from a directory of individual underscore_named .pt files, then re-export them as JIT-wrapped (TensorContainer) dot_named .pt files for C++ loading.")
								    parser.add_argument('--source_individual_weights_dir', type=str, required=True,
								                        help="Directory containing the source underscore_named .pt files (e.g., 'exported_weights/backbone/').")
								    parser.add_argument('--output_jit_wrapped_tensors_dir', type=str, required=True,
								                        help="Directory to save the re-exported JIT-wrapped dot_named .pt files (e.g., 'exported_weights/raw_backbone/').")

								    args = parser.parse_args()

								    # The module-level import of resnet50 only prints a warning on
								    # ImportError, which leaves the name unbound. Fail with a clear message
								    # instead of a NameError. Checked after argument parsing so that
								    # --help keeps working without the ltr package.
								    if globals().get("resnet50") is None:
								        print("Error: resnet50 could not be imported from ltr.models.backbone.resnet; cannot instantiate the model.")
								        sys.exit(1)

								    print("Instantiating a new ResNet-50 model (will be populated from source dir)...")
								    model = resnet50(output_layers=['layer4'], pretrained=False)
								    print("ResNet-50 model instantiated.")

								    load_weights_from_individual_files(model, args.source_individual_weights_dir)

								    export_jit_wrapped_tensors(model, args.output_jit_wrapped_tensors_dir)

								    print("Process complete. Weights loaded from source (underscore_named) and re-exported as JIT-wrapped tensors (dot_named).")