more elegant solution for deduplicating instruments

Also edits the docstring of deduplicate_instruments_from_layers to better explain
what it does, and fixes a small typo ('default=' instead of 'default =') on row 448.
This commit is contained in:
2026-02-17 16:02:14 +01:00
parent d83873c763
commit 3ae6b86b8e

View File

@@ -100,7 +100,9 @@ def chain_layer_to_target(layer_object):
def deduplicate_instruments_from_layers(layers): def deduplicate_instruments_from_layers(layers):
''' '''
Takes a list of Layer-class objects and for each layer gets the instruments used (laser, depo chamber and RHEED), returns deduplicated list. Ideally, the lists should only contain one element. Takes a list of Layer-class objects and for each layer gets the instruments used (laser, depo chamber and RHEED), returns dictionary with one item per category. This means that if more layers share the same instruments it returns a dictionary with just their names as strings (no lists or sub-dictionaries).
If different layers have different instruments (e.g. laser systems) the user is prompted to only select one.
''' '''
lasers = [] lasers = []
chambers = [] chambers = []
@@ -113,22 +115,54 @@ def deduplicate_instruments_from_layers(layers):
ded_lasers = list( set( lasers ) ) ded_lasers = list( set( lasers ) )
ded_chambers = list( set( chambers ) ) ded_chambers = list( set( chambers ) )
ded_rheeds = list( set( rheeds ) ) ded_rheeds = list( set( rheeds ) )
elegant_list = [ ded_lasers, ded_chambers, ded_rheeds] elegant_dict = {
if 0 in [ len(i) for i in elegant_list ]: # Keep key names human readable since they're used in the messages of the following errors
# i.e. if length of one of the lists in elegant_list is zero (missing data): "Laser Systems": ded_lasers,
raise IndexError("Missing data: no Laser System, Chamber and/or RHEED System is specified in any of the Deposition-type experiments related to this sample.") "Deposition Chamber": ded_chambers,
if not all([ len(i) == 1 for i in elegant_list ]): "RHEED Systems": ded_rheeds
} # dictionary's name's a joke
updated_dict = {} # use this for containing the final dataset
for ded in elegant_dict:
if len(elegant_dict[ded]) == 0:
# if len of list is 0 - empty list - raise error
raise IndexError(f"Missing data: no Laser System, Chamber and/or RHEED System is specified in any of the Deposition-type experiments related to this sample. Fix this on eLabFTW before retrying. Affected list: {ded}.")
elif len(elegant_dict[ded]) > 1:
# if len of list is > 1 - too many values - allow the user to pick one
print("Warning: different instruments have been used for different layers - which is currently not allowed.") print("Warning: different instruments have been used for different layers - which is currently not allowed.")
# for every element in elegant list check if len > 1 and if it is # there's a better way to do this but I can't remember now for the life of me...
print("Selecting the first occurence for every category...") i = 0
while i < len(elegant_dict[ded]):
print(f"{i} - {elegant_dict[ded][i]}")
i += 1
ans = None
while not type(ans) == int or not ans in range(0, len(elegant_dict[ded])):
ans = input("Please pick one of the previous (0, 1, ...) [default = 0]: ") or "0"
if ans.isdigit():
ans = int(ans)
continue # unnecessary?
updated_dict[ded] = elegant_dict[ded][ans]
elif elegant_dict[ded][0] in ["", 0, None]:
# if len is 1 BUT value is "", 0 or None raise error
raise ValueError(f"Missing data: a Laser System, Chamber and/or RHEED System which is specified across all the Deposition-type experiments related to this sample is either empty or invalid. Fix this on eLabFTW before retrying. Affected list: {ded}.")
else:
# if none of the previous (only 1 value), that single value is used
updated_dict[ded] = elegant_dict[ded][0]
instruments_used_dict = { instruments_used_dict = {
"laser_system": ded_lasers[0], "laser_system": updated_dict["Laser Systems"],
"deposition_chamber": ded_chambers[0], "deposition_chamber": updated_dict["Deposition Chamber"],
"rheed_system": ded_rheeds[0], "rheed_system": updated_dict["RHEED Systems"],
} }
return instruments_used_dict return instruments_used_dict
### OLD CODE
# if 0 in [ len(i) for i in elegant_list ]:
# # i.e. if length of one of the lists in elegant_list is zero (missing data):
# raise IndexError("Missing data: no Laser System, Chamber and/or RHEED System is specified in any of the Deposition-type experiments related to this sample.")
# if not all([ len(i) == 1 for i in elegant_list ]):
# print("Warning: different instruments have been used for different layers - which is currently not allowed.")
# # for every element in elegant list check if len > 1 and if it is
# print("Selecting the first occurence for every category...")
###
# lasers = { f"layer_{lyr.layer_number}": lyr.laser_system for lyr in layers } # lasers = { f"layer_{lyr.layer_number}": lyr.laser_system for lyr in layers }
# chambers = { f"layer_{lyr.layer_number}": lyr.deposition_chamber for lyr in layers } # chambers = { f"layer_{lyr.layer_number}": lyr.deposition_chamber for lyr in layers }
# rheeds = { f"layer_{lyr.layer_number}": lyr.rheed_system for lyr in layers } # rheeds = { f"layer_{lyr.layer_number}": lyr.rheed_system for lyr in layers }