diff --git a/aiidalab_eln/openbis/__init__.py b/aiidalab_eln/openbis/__init__.py index ac8b653..ce5674c 100644 --- a/aiidalab_eln/openbis/__init__.py +++ b/aiidalab_eln/openbis/__init__.py @@ -1,17 +1,18 @@ -from ..base_connector import ElnConnector -import traitlets as tl -from aiida import orm -import ipywidgets as ipw -import pybis as pb +import os from datetime import datetime -import os +import ipywidgets as ipw import numpy as np +import pybis as pb +import traitlets as tl +from aiida import orm, plugins +from ase import Atoms from rdkit import Chem from rdkit.Chem import AllChem -from ase import Atoms from sklearn.decomposition import PCA -from aiida import plugins + +from ..base_connector import ElnConnector + def make_ase(species, positions): """Create ase Atoms object.""" @@ -23,6 +24,7 @@ def make_ase(species, positions): return atoms + def _rdkit_opt(smiles, steps=1000): """Optimize a molecule using force field and rdkit (needed for complex SMILES).""" @@ -37,11 +39,12 @@ def _rdkit_opt(smiles, steps=1000): species = [mol.GetAtomWithIdx(j).GetSymbol() for j in range(natoms)] return make_ase(species, positions) + def import_smiles(sample): object_type = plugins.DataFactory("structure") node = object_type(ase=_rdkit_opt(sample.props.smiles)) return node - + class OpenbisElnConnector(ElnConnector): """OpenBIS ELN connector to AiiDAlab.""" @@ -81,7 +84,6 @@ def __init__(self, **kwargs): ) tl.link((self, "sample_uuid"), (self.sample_uuid_widget, "value")) - self.output = ipw.Output() super().__init__( @@ -98,18 +100,19 @@ def __init__(self, **kwargs): ], **kwargs, ) + def connect(self): """Function to login to openBIS.""" self.session = pb.Openbis(self.eln_instance, verify_certificates=False) self.session.set_token(self.token) return "" - + def set_sample_config(self, **kwargs): """Set sample-related variables from a config.""" for key, value in kwargs.items(): if hasattr(self, key) and key in ("file_name", "sample_uuid"): setattr(self, key, value) - + def get_config(self): return { "eln_instance": self.eln_instance, @@ -128,31 +131,31 @@ def is_connected(self): @tl.default("eln_type") def set_eln_type(self): # pylint: disable=no-self-use return "openbis" - + def sample_config_editor(self): return ipw.VBox( [ self.sample_uuid_widget, ] ) - + def get_all_structures_and_geoopts(self, node): """Get all atomistic models that led to the one used in the simulation""" current_node = node all_structures = [] all_geoopts = [] - + while current_node is not None: if isinstance(current_node, orm.StructureData): all_structures.append(current_node) current_node = current_node.creator - + elif isinstance(current_node, orm.CalcJobNode): current_node = current_node.caller - + elif isinstance(current_node, orm.CalcFunctionNode): current_node = current_node.inputs.source_structure - + elif isinstance(current_node, orm.WorkChainNode): if "GeoOpt" in current_node.label: all_geoopts.append(current_node) @@ -161,15 +164,15 @@ def get_all_structures_and_geoopts(self, node): current_node = current_node.inputs.structure else: current_node = current_node.caller - + return all_structures, all_geoopts - + def import_data(self): """Import data object from OpenBIS ELN to AiiDAlab.""" - + sample = self.extract_sample_id() - - #print("Sample", sample) + + # print("Sample", sample) if self.data_type == "smiles": self.node = import_smiles(sample) eln_info = { @@ -177,35 +180,53 @@ def import_data(self): "eln_type": self.eln_type, "sample_uuid": self.sample_uuid, "data_type": self.data_type, - "molecule_uuid": sample.permId + "molecule_uuid": sample.permId, } self.node.set_extra("eln", eln_info) self.node.store() - - def create_new_collection_openbis(self, project_code, collection_code, collection_type, collection_name): - collection = self.session.new_collection(project = project_code, code = collection_code, type = collection_type) + + def create_new_collection_openbis( + self, project_code, collection_code, collection_type, collection_name + ): + collection = self.session.new_collection( + project=project_code, code=collection_code, type=collection_type + ) collection.props["$name"] = collection_name collection.save() return collection def get_collection_openbis(self, collection_identifier): - return self.session.get_collection(code = collection_identifier) - + return self.session.get_collection(code=collection_identifier) + def check_if_collection_exists(self, project_code, collection_code): - return self.session.get_collections(project = project_code, code = collection_code).df.empty == False - - def create_collection_openbis(self, project_code, collection_name, collection_code, collection_type, collection_exists): + return ( + self.session.get_collections( + project=project_code, code=collection_code + ).df.empty + == False + ) + + def create_collection_openbis( + self, + project_code, + collection_name, + collection_code, + collection_type, + collection_exists, + ): if collection_exists == False: - collection = self.create_new_collection_openbis(project_code, collection_code, collection_type, collection_name) + collection = self.create_new_collection_openbis( + project_code, collection_code, collection_type, collection_name + ) else: collection_identifier = f"{project_code}/{collection_code}" collection = self.get_collection_openbis(collection_identifier) - + return collection - + def get_objects_list_openbis(self, object_type): - return self.session.get_objects(type = object_type) - + return self.session.get_objects(type=object_type) + def check_aiida_objects_in_openbis(self, aiida_objects, openbis_objects): aiida_objects_inside_openbis = [] # Verify which AiiDA objects are already in openBIS @@ -215,25 +236,39 @@ def check_aiida_objects_in_openbis(self, aiida_objects, openbis_objects): if openbis_object.props.get("wfms-uuid") == aiida_object.uuid: aiida_objects_inside_openbis.append([openbis_object, True]) aiida_object_inside_openbis_exists = True - print(f"Object {openbis_object.props.get('wfms-uuid')} already exists.") + print( + f"Object {openbis_object.props.get('wfms-uuid')} already exists." + ) if aiida_object_inside_openbis_exists == False: aiida_objects_inside_openbis.append([None, False]) - + # Reverse the lists because in openBIS, one should start by building the parents. aiida_objects.reverse() aiida_objects_inside_openbis.reverse() - + return aiida_objects, aiida_objects_inside_openbis - def create_new_object_openbis(self, collection_identifier, object_type, parents = None): + def create_new_object_openbis( + self, collection_identifier, object_type, parents=None + ): if parents == None: - return self.session.new_sample(collection = collection_identifier, type = object_type) + return self.session.new_sample( + collection=collection_identifier, type=object_type + ) else: - return self.session.new_sample(collection = collection_identifier, type = object_type, parents = parents) - - def set_object_props(self, aiida_object_index, aiida_object, number_aiida_objects, openbis_object_type): - + return self.session.new_sample( + collection=collection_identifier, type=object_type, parents=parents + ) + + def set_object_props( + self, + aiida_object_index, + aiida_object, + number_aiida_objects, + openbis_object_type, + ): + if openbis_object_type == "ATOMISTIC_MODEL": # Get Structure details from AiiDA structure_ase = aiida_object.get_ase() @@ -241,207 +276,275 @@ def set_object_props(self, aiida_object_index, aiida_object, number_aiida_object # structure_ase.symbols # Atoms Symbols # structure_ase.pbc # PBC (X, Y, Z) # structure.cell # Cell vectors - + object_props = { "$name": f"Atomistic Model {aiida_object_index}", "wfms-uuid": aiida_object.uuid, "pbc-x": int(structure_ase.pbc[0]), "pbc-y": int(structure_ase.pbc[1]), - "pbc-z": int(structure_ase.pbc[2]) + "pbc-z": int(structure_ase.pbc[2]), } - - if number_aiida_objects > 1 and aiida_object_index == number_aiida_objects - 1: # If it is the last of more than one structures, it is optimised. + + if ( + number_aiida_objects > 1 + and aiida_object_index == number_aiida_objects - 1 + ): # If it is the last of more than one structures, it is optimised. object_props["optimised"] = 1 else: object_props["optimised"] = 0 - + return object_props - - def create_atomistic_models(self, structures_nodes, structures_inside_openbis, collection_identifier): + + def create_atomistic_models( + self, structures_nodes, structures_inside_openbis, collection_identifier + ): atomistic_models = [] selected_molecule = None - + for structure_index, structure in enumerate(structures_nodes): - + # If the structure contains a molecule, save it as a parent of the previous atomistic model because it is the molecule that started all the simulation if "eln" in structure.base.extras.all: - selected_molecule = self.session.get_sample(structure.base.extras.all["eln"]["molecule_uuid"]) + selected_molecule = self.session.get_sample( + structure.base.extras.all["eln"]["molecule_uuid"] + ) else: structure_inside_openbis = structures_inside_openbis[structure_index] - + if structure_inside_openbis[1] == False: # Create Atomistic Model in openBIS number_aiida_objects = len(structures_nodes) - atomistic_model = self.create_new_object_openbis(collection_identifier, "ATOMISTIC_MODEL") - atomistic_model.props = self.set_object_props(structure_index, structure, number_aiida_objects, "ATOMISTIC_MODEL") + atomistic_model = self.create_new_object_openbis( + collection_identifier, "ATOMISTIC_MODEL" + ) + atomistic_model.props = self.set_object_props( + structure_index, + structure, + number_aiida_objects, + "ATOMISTIC_MODEL", + ) atomistic_model.save() atomistic_models.append(atomistic_model) else: atomistic_models.append(structure_inside_openbis[0]) - + # If the simulation started from openBIS, we make the connection between the molecule and the first atomistic model # If the atomistic model (second structure, right after the molecule) is already there, there is no need to make the connection, because in principle it already contains it if selected_molecule is not None and structures_inside_openbis[1][1] == False: atomistic_models[0].add_parents(selected_molecule) atomistic_models[0].save() - + return atomistic_models - def create_geoopts_simulations(self, geoopts_nodes, geoopts_inside_openbis, collection_identifier, atomistic_models): + def create_geoopts_simulations( + self, + geoopts_nodes, + geoopts_inside_openbis, + collection_identifier, + atomistic_models, + ): geoopts_simulations = [] - + for geoopt_index, geoopt in enumerate(geoopts_nodes): geoopt_inside_openbis = geoopts_inside_openbis[geoopt_index] - + if geoopt_inside_openbis[1] == False: parent_atomistic_model = atomistic_models[geoopt_index] - geoopt_simulation = self.create_new_object_openbis(collection_identifier, "SIMULATION", [parent_atomistic_model]) + geoopt_simulation = self.create_new_object_openbis( + collection_identifier, "SIMULATION", [parent_atomistic_model] + ) geoopt_simulation.props = { "$name": f"GeoOpt Simulation {geoopt_index}", - "wfms-uuid": geoopt.uuid + "wfms-uuid": geoopt.uuid, } geoopt_simulation.save() - - geoopt_model = self.create_new_object_openbis(collection_identifier, "GEO_OPTIMISATION", [geoopt_simulation]) + + geoopt_model = self.create_new_object_openbis( + collection_identifier, "GEO_OPTIMISATION", [geoopt_simulation] + ) geoopt_model.save() - + # Its plus one because there are N+1 geometries for N GeoOpts atomistic_models[geoopt_index + 1].add_parents(geoopt_model) atomistic_models[geoopt_index + 1].save() - + geoopts_simulations.append(geoopt_simulation) else: geoopts_simulations.append(geoopt_inside_openbis[0]) - + return geoopts_simulations, atomistic_models - def create_stm_simulations(self, stms_nodes, stms_inside_openbis, collection_identifier, atomistic_models): + def create_stm_simulations( + self, stms_nodes, stms_inside_openbis, collection_identifier, atomistic_models + ): stms_simulations = [] - + for stm_index, stm in enumerate(stms_nodes): stm_inside_openbis = stms_inside_openbis[stm_index] - + if stms_inside_openbis[0][1] == False: - + optimised_atomistic_model = atomistic_models[-1] - + # Simulation object - stm_simulation = self.create_new_object_openbis(collection_identifier, "SIMULATION", [optimised_atomistic_model]) + stm_simulation = self.create_new_object_openbis( + collection_identifier, "SIMULATION", [optimised_atomistic_model] + ) stm_simulation.props = { "$name": f"STM Simulation {stm_index}", "description": "STM Simulation", - "wfms-uuid": stm.uuid + "wfms-uuid": stm.uuid, } stm_simulation.save() # Simulated STM - stm_model = self.create_new_object_openbis(collection_identifier, "STM", [stm_simulation]) + stm_model = self.create_new_object_openbis( + collection_identifier, "STM", [stm_simulation] + ) # dft_params = dict(self.node.inputs.dft_params) - - #TODO: Remove this is the future. Orbitals do not have stm_params + + # TODO: Remove this is the future. Orbitals do not have stm_params try: stm_params = dict(stm.inputs.spm_params) stm_model.props = { - "emin-j": float(stm_params['--energy_range'][0]) * 1.60217663e-19, - "emax-j": float(stm_params['--energy_range'][1]) * 1.60217663e-19, - "de-j": float(stm_params['--energy_range'][2]) * 1.60217663e-19 + "emin-j": float(stm_params["--energy_range"][0]) + * 1.60217663e-19, + "emax-j": float(stm_params["--energy_range"][1]) + * 1.60217663e-19, + "de-j": float(stm_params["--energy_range"][2]) * 1.60217663e-19, } except: pass - - stm_model.props['$name'] = f"Simulated STM {stm_index}" + + stm_model.props["$name"] = f"Simulated STM {stm_index}" stm_model.save() - + # stm_simulation_images_zip_filename = series_plotter_inst.create_zip_link_for_openbis() - + # stm_simulation_images_dataset = self.session.new_dataset( - # type = "RAW_DATA", + # type = "RAW_DATA", # files = [stm_simulation_images_zip_filename], # sample = stm_simulation_model # ) # stm_simulation_images_dataset.save() - #TODO: How to do this using Python commands? + # TODO: How to do this using Python commands? stm_simulation_dataset_filename = "stm_simulation.aiida" - os.system(f"verdi archive create {stm_simulation_dataset_filename} --no-call-calc-backward --no-call-work-backward --no-create-backward -N {stm.pk}") + os.system( + f"verdi archive create {stm_simulation_dataset_filename} --no-call-calc-backward --no-call-work-backward --no-create-backward -N {stm.pk}" + ) stm_simulation_dataset = self.session.new_dataset( - type = "RAW_DATA", - files = [stm_simulation_dataset_filename], - sample = stm_model + type="RAW_DATA", + files=[stm_simulation_dataset_filename], + sample=stm_model, ) stm_simulation_dataset.save() - + # Delete the file after uploading os.remove(stm_simulation_dataset_filename) - + stms_simulations.append(stm_model) else: stms_simulations.append(stm_inside_openbis[0]) - + return stms_simulations - + def export_data(self): """Export AiiDA object (node attribute of this class) to ELN.""" # Get experiment from openBIS selected_experiment = self.session.get_experiment(self.sample_uuid) - + # Create a collection for storing atomistic models in openBIS if it is not already there inventory_project_code = "/MATERIALS/ATOMISTIC_MODELS" atomistic_models_collection_name = "Atomistic Models" atomistic_models_collection_type = "COLLECTION" atomistic_models_collection_code = "ATOMISTIC_MODELS_COLLECTION" - atomistic_models_collection_identifier = f"{inventory_project_code}/{atomistic_models_collection_code}" - - atomistic_models_collection_exists = self.check_if_collection_exists(inventory_project_code, atomistic_models_collection_code) - _ = self.create_collection_openbis(inventory_project_code, atomistic_models_collection_name, atomistic_models_collection_code, atomistic_models_collection_type, atomistic_models_collection_exists) - + atomistic_models_collection_identifier = ( + f"{inventory_project_code}/{atomistic_models_collection_code}" + ) + + atomistic_models_collection_exists = self.check_if_collection_exists( + inventory_project_code, atomistic_models_collection_code + ) + _ = self.create_collection_openbis( + inventory_project_code, + atomistic_models_collection_name, + atomistic_models_collection_code, + atomistic_models_collection_type, + atomistic_models_collection_exists, + ) + # Get all simulations and atomistic models from openbis simulations_openbis = self.get_objects_list_openbis("SIMULATION") atomistic_models_openbis = self.get_objects_list_openbis("ATOMISTIC_MODEL") - + # Get Geometry Optimisation Workchain from AiiDA - all_structures, all_aiida_geoopts = self.get_all_structures_and_geoopts(self.node) - + all_structures, all_aiida_geoopts = self.get_all_structures_and_geoopts( + self.node + ) + # Verify which GeoOpts are already in openBIS - all_aiida_geoopts, all_geoopts_inside_openbis = self.check_aiida_objects_in_openbis(all_aiida_geoopts, simulations_openbis) - + all_aiida_geoopts, all_geoopts_inside_openbis = ( + self.check_aiida_objects_in_openbis(all_aiida_geoopts, simulations_openbis) + ) + # Verify which structures (atomistic models) are already in openBIS - all_structures, all_structures_inside_openbis = self.check_aiida_objects_in_openbis(all_structures, atomistic_models_openbis) - + all_structures, all_structures_inside_openbis = ( + self.check_aiida_objects_in_openbis( + all_structures, atomistic_models_openbis + ) + ) + # Get the project identifier of the selected experiment # project_identifier = selected_experiment.project.identifier - + # Create a new simulation experiment in openBIS # now = datetime.now() # simulation_number = now.strftime("%d%m%Y%H%M%S") # simulation_experiment_code = f"SIMULATION_EXPERIMENT_{simulation_number}" # simulation_experiment_name = "Simulation of Methane on Au" # simulation_experiment = self.get_collection_openbis(self.sample_uuid) - - #TODO: Do we need to create a simulation experiment or do we put the simulations inside the selected experiment? + + # TODO: Do we need to create a simulation experiment or do we put the simulations inside the selected experiment? simulation_experiment_identifier = selected_experiment.identifier - + # Build atomistic models (structures in AiiDA) in openBIS - all_atomistic_models = self.create_atomistic_models(all_structures, all_structures_inside_openbis, atomistic_models_collection_identifier) - + all_atomistic_models = self.create_atomistic_models( + all_structures, + all_structures_inside_openbis, + atomistic_models_collection_identifier, + ) + # Build GeoOpts in openBIS - all_geoopts_simulations, all_atomistic_models = self.create_geoopts_simulations(all_aiida_geoopts, all_geoopts_inside_openbis, simulation_experiment_identifier, all_atomistic_models) - + all_geoopts_simulations, all_atomistic_models = self.create_geoopts_simulations( + all_aiida_geoopts, + all_geoopts_inside_openbis, + simulation_experiment_identifier, + all_atomistic_models, + ) + if isinstance(self.node, orm.WorkChainNode): - + # Get structure used in the Workchain all_aiida_stms = [self.node] - + # Verify which structures (atomistic models) are already in openBIS - all_aiida_stms, all_stms_inside_openbis = self.check_aiida_objects_in_openbis(all_aiida_stms, simulations_openbis) - + all_aiida_stms, all_stms_inside_openbis = ( + self.check_aiida_objects_in_openbis(all_aiida_stms, simulations_openbis) + ) + # Build STM Simulations in openBIS - all_stms_simulations = self.create_stm_simulations(all_aiida_stms, all_stms_inside_openbis, simulation_experiment_identifier, all_atomistic_models) - + all_stms_simulations = self.create_stm_simulations( + all_aiida_stms, + all_stms_inside_openbis, + simulation_experiment_identifier, + all_atomistic_models, + ) + def extract_sample_id(self): - + experiment = self.session.get_experiment(self.sample_uuid) samples = experiment.get_samples() @@ -456,6 +559,5 @@ def extract_sample_id(self): if parent_sample.type.code == "MOLECULE": molecule_sample = self.session.get_sample(parent_sample.permId) break - - return molecule_sample + return molecule_sample