Compare commits
14 Commits
207d166227
...
dev
| Author | SHA256 | Date | |
|---|---|---|---|
| 1523c973f4 | |||
| 5cf67648af | |||
| 839799a13f | |||
| 10c68bf260 | |||
| bab5e958cb | |||
| fc150be724 | |||
| aa3bf531f9 | |||
| 3f97ccee25 | |||
| 3ae6b86b8e | |||
| d83873c763 | |||
| de401b5474 | |||
| fde2615107 | |||
| 59e173c54f | |||
| 712cbc4788 |
@@ -1,62 +0,0 @@
|
||||
"""
|
||||
Currently unused!
|
||||
"""
|
||||
import json, requests
|
||||
from APIHandler import APIHandler
|
||||
|
||||
def get_entry_from_elabid(elabid, entryType="items"):
|
||||
'''
|
||||
Function which returns entrypoint data (as dictionary) from its elabid.
|
||||
'''
|
||||
header = APIHandler(apikey).dump
|
||||
response = requests.get(
|
||||
headers = header,
|
||||
url = f"{ELABFTW_API_URL}/{entryType}/{elabid}",
|
||||
verify=True
|
||||
)
|
||||
if response.status_code // 100 in [2,3]:
|
||||
entry_data = response.json()
|
||||
return entry_data
|
||||
else:
|
||||
raise ConnectionError(f"HTTP request failed with status code: {response.status_code}.")
|
||||
|
||||
def get_sample_layers_data(elabid):
|
||||
'''
|
||||
Return the following data from every eLabFTW experiment linked
|
||||
to a certain sample, identified by elabid.
|
||||
|
||||
- Title of the experiment
|
||||
- Category (should check it's "PLD Deposition")
|
||||
- Layer number - if present (PLD depositions)
|
||||
- Deposition time - returns error if not present
|
||||
- Repetition rate - returns error if not present
|
||||
'''
|
||||
# header = {
|
||||
# "Authorization": apikey,
|
||||
# "Content-Type": "application/json"
|
||||
# }
|
||||
sample_data = requests.get(
|
||||
headers = header,
|
||||
url = f"https://elabftw.fisica.unina.it/api/v2/items/{elabid}",
|
||||
verify=True
|
||||
).json()
|
||||
related_experiments = sample_data["related_experiments_links"]
|
||||
result = []
|
||||
for exp in related_experiments:
|
||||
experiment_data = requests.get(
|
||||
headers = header,
|
||||
url = f"https://elabftw.fisica.unina.it/api/v2/experiments/{exp.get("entityid")}",
|
||||
verify=True
|
||||
).json()
|
||||
extra = experiment_data["metadata_decoded"]["extra_fields"]
|
||||
result.append(
|
||||
{"title": exp.get("title"),
|
||||
"layer_number": extra.get("Layer Progressive Number").get("value"),
|
||||
"category": exp.get("category_title"),
|
||||
"deposition_time": extra.get("Duration").get("value"),
|
||||
"repetition_rate": extra.get("Repetition rate").get("value")}
|
||||
)
|
||||
return result
|
||||
|
||||
if __name__=="__main__":
|
||||
print("Warning: you're not supposed to be running this as the main program.")
|
||||
241
src/main.py
241
src/main.py
@@ -1,4 +1,5 @@
|
||||
import os, json, requests, h5py
|
||||
import numpy as np
|
||||
from getpass import getpass
|
||||
from APIHandler import APIHandler
|
||||
from classes import *
|
||||
@@ -100,21 +101,75 @@ def chain_layer_to_target(layer_object):
|
||||
|
||||
def deduplicate_instruments_from_layers(layers):
|
||||
'''
|
||||
Takes a list of Layer-class objects and for each layer gets the instruments used (laser, depo chamber and RHEED), returns deduplicated list. Ideally, the lists should only contain one element.
|
||||
Takes a list of Layer-class objects and for each layer gets the instruments used (laser, depo chamber and RHEED), returns dictionary with one item per category. This means that if more layers share the same instruments it returns a dictionary with just their names as strings (no lists or sub-dictionaries).
|
||||
|
||||
If different layers have different instruments (e.g. laser systems) the user is prompted to only select one.
|
||||
'''
|
||||
lasers = []
|
||||
chambers = []
|
||||
rheeds = []
|
||||
elegant_dict = {}
|
||||
for lyr in layers:
|
||||
instruments = lyr.get_instruments(apikey)
|
||||
lasers.append(instruments["laser_system"])
|
||||
chambers.append(instruments["deposition_chamber"])
|
||||
rheeds.append(instruments["rheed_system"])
|
||||
instruments_used_dict = {
|
||||
"laser_system": list( set( lasers ) ),
|
||||
"deposition_chamber": list( set( chambers ) ),
|
||||
"rheed_system" : list( set( rheeds ) ),
|
||||
}
|
||||
elegant_dict[f"layer_{lyr.layer_number}"] = {
|
||||
"laser_system": instruments["laser_system"],
|
||||
"deposition_chamber": instruments["deposition_chamber"],
|
||||
"rheed_system": instruments["rheed_system"],
|
||||
}
|
||||
ded_lasers = list( set( lasers ) )
|
||||
ded_chambers = list( set( chambers ) )
|
||||
ded_rheeds = list( set( rheeds ) )
|
||||
elegant_dict["multilayer"] = {
|
||||
# Keep key names human readable since they're used in the messages of the following errors
|
||||
"laser_system": ", ".join(ded_lasers),
|
||||
"deposition_chamber": ", ".join(ded_chambers),
|
||||
"rheed_system": ", ".join(ded_rheeds)
|
||||
} # dictionary's name is a joke
|
||||
# updated_dict = {} # use this for containing the final dataset
|
||||
# for ded in elegant_dict:
|
||||
# if len(elegant_dict[ded]) == 0:
|
||||
# # if len of list is 0 - empty list - raise error
|
||||
# raise IndexError(f"Missing data: no Laser System, Chamber and/or RHEED System is specified in any of the Deposition-type experiments related to this sample. Fix this on eLabFTW before retrying. Affected list: {ded}.")
|
||||
# elif len(elegant_dict[ded]) > 1:
|
||||
# # if len of list is > 1 - too many values - allow the user to pick one
|
||||
# print("Warning: different instruments have been used for different layers - which is currently not allowed.")
|
||||
# # there's a better way to do this but I can't remember now for the life of me...
|
||||
# i = 0
|
||||
# while i < len(elegant_dict[ded]):
|
||||
# print(f"{i} - {elegant_dict[ded][i]}")
|
||||
# i += 1
|
||||
# ans = None
|
||||
# while not type(ans) == int or not ans in range(0, len(elegant_dict[ded])):
|
||||
# ans = input("Please pick one of the previous (0, 1, ...) [default = 0]: ") or "0"
|
||||
# if ans.isdigit():
|
||||
# ans = int(ans)
|
||||
# continue # unnecessary?
|
||||
# updated_dict[ded] = elegant_dict[ded][ans]
|
||||
# elif elegant_dict[ded][0] in ["", 0, None]:
|
||||
# # if len is 1 BUT value is "", 0 or None raise error
|
||||
# raise ValueError(f"Missing data: a Laser System, Chamber and/or RHEED System which is specified across all the Deposition-type experiments related to this sample is either empty or invalid. Fix this on eLabFTW before retrying. Affected list: {ded}.")
|
||||
# else:
|
||||
# # if none of the previous (only 1 value), that single value is used
|
||||
# updated_dict[ded] = elegant_dict[ded][0]
|
||||
# instruments_used_dict = {
|
||||
# "laser_system": updated_dict["Laser Systems"],
|
||||
# "deposition_chamber": updated_dict["Deposition Chamber"],
|
||||
# "rheed_system": updated_dict["RHEED Systems"],
|
||||
# }
|
||||
return elegant_dict
|
||||
|
||||
### OLD CODE
|
||||
# if 0 in [ len(i) for i in elegant_list ]:
|
||||
# # i.e. if length of one of the lists in elegant_list is zero (missing data):
|
||||
# raise IndexError("Missing data: no Laser System, Chamber and/or RHEED System is specified in any of the Deposition-type experiments related to this sample.")
|
||||
# if not all([ len(i) == 1 for i in elegant_list ]):
|
||||
# print("Warning: different instruments have been used for different layers - which is currently not allowed.")
|
||||
# # for every element in elegant list check if len > 1 and if it is
|
||||
# print("Selecting the first occurence for every category...")
|
||||
###
|
||||
# lasers = { f"layer_{lyr.layer_number}": lyr.laser_system for lyr in layers }
|
||||
# chambers = { f"layer_{lyr.layer_number}": lyr.deposition_chamber for lyr in layers }
|
||||
# rheeds = { f"layer_{lyr.layer_number}": lyr.rheed_system for lyr in layers }
|
||||
@@ -123,12 +178,52 @@ def deduplicate_instruments_from_layers(layers):
|
||||
# "deposition_chamber": chambers,
|
||||
# "rheed_system": rheeds,
|
||||
# }
|
||||
return instruments_used_dict
|
||||
|
||||
def analyse_rheed_data(data):
|
||||
'''
|
||||
Takes the content of a tsv file and returns a dictionary with timestamps and intensities.
|
||||
The file should contain a 2D array composed of 4 columns - where the first column is a timestamp and the other three are RHEED intensities - and an unspecified number of rows.
|
||||
|
||||
-----
|
||||
Time Layer1_Int1 Layer1_Int2 Layer1_Int3
|
||||
-----
|
||||
|
||||
Distinct ValueErrors are raised if:
|
||||
- The array is not 2-dimensional;
|
||||
- The total number of columns does not equate exactly 1+3 (= 4).
|
||||
|
||||
Time is expressed in seconds, intensities are normalized (adimensional).
|
||||
|
||||
# TO-DO: complete this description...
|
||||
Written with help from DeepSeek.
|
||||
'''
|
||||
# Verifying the format of the input file:
|
||||
if data.ndim != 2:
|
||||
raise ValueError(f"Unexpected trace format: expected 2D array, got ndim = {data.ndim}.")
|
||||
n_cols = data.shape[1] # 0 = rows, 1 = columns
|
||||
if n_cols > 4:
|
||||
print(f"Warning! The input file (for Realtime Window Analysis) has {n_cols-4} more than needed.\nOnly 4 columns will be considered - with the first representing time and the others representing RHEED intensities.")
|
||||
if n_cols < 4:
|
||||
raise ValueError(f"Insufficient number of columns: expected 4, got n_cols = {n_cols}.")
|
||||
n_time_points = data.shape[0]
|
||||
|
||||
# Get time (all rows of col 0) as Float64:
|
||||
time = data[:, 0].astype(np.float64, copy=False) # copy=False suggested by LLM for mem. eff.
|
||||
|
||||
# Get intensities (all rows of cols 1,2,3) as Float32:
|
||||
intensities = data[:, 1:4].astype(np.float32, copy=False)
|
||||
|
||||
return {
|
||||
"time": time,
|
||||
"intensity": intensities,
|
||||
}
|
||||
|
||||
|
||||
def make_nexus_schema_dictionary(substrate_object, layers):
|
||||
'''
|
||||
Main function, takes all the other functions to reconstruct the full dataset. Takes a Substrate-class object (output of the chain_entrypoint_to_batch() function) and a list of Layer-class objects (output of the chain_entrypoint_to_layers() function), returns dictionary with the same schema as the NeXus standard for PLD fabrications.
|
||||
'''
|
||||
instruments = deduplicate_instruments_from_layers(layers)
|
||||
pld_fabrication = {
|
||||
"sample": {
|
||||
"substrate": {
|
||||
@@ -151,7 +246,7 @@ def make_nexus_schema_dictionary(substrate_object, layers):
|
||||
},
|
||||
"multilayer": {},
|
||||
},
|
||||
"instruments_used": deduplicate_instruments_from_layers(layers),
|
||||
"instruments_used": instruments["multilayer"],
|
||||
}
|
||||
multilayer = pld_fabrication["sample"]["multilayer"]
|
||||
for layer in layers:
|
||||
@@ -251,10 +346,11 @@ def make_nexus_schema_dictionary(substrate_object, layers):
|
||||
"units": layer.post_annealing_duration_unit,
|
||||
},
|
||||
},
|
||||
"instruments_used": instruments[name],
|
||||
}
|
||||
return pld_fabrication
|
||||
|
||||
def build_nexus_file(pld_fabrication, output_path):
|
||||
def build_nexus_file(pld_fabrication, output_path, rheed_osc=None):
|
||||
# NOTE: look at the mail attachment from Emiliano...
|
||||
with h5py.File(output_path, "w") as f:
|
||||
nx_pld_entry = f.create_group("pld_fabrication")
|
||||
@@ -297,29 +393,39 @@ def build_nexus_file(pld_fabrication, output_path):
|
||||
nx_layer.attrs["NX_class"] = "NXsubentry"
|
||||
layer_dict = multilayer_dict[layer]
|
||||
# Sub-groups of a layer
|
||||
## Target
|
||||
nx_target = nx_layer.create_group("target")
|
||||
nx_target.attrs["NX_class"] = "NXsample"
|
||||
target_dict = layer_dict["target"]
|
||||
## Rastering and Annealing
|
||||
nx_laser_rastering = nx_layer.create_group("laser_rastering")
|
||||
nx_pre_annealing = nx_layer.create_group("pre_annealing")
|
||||
nx_post_annealing = nx_layer.create_group("post_annealing")
|
||||
nx_laser_rastering.attrs["NX_class"] = "NXprocess"
|
||||
rastering_dict = layer_dict["laser_rastering"]
|
||||
nx_pre_annealing = nx_layer.create_group("pre_annealing")
|
||||
nx_pre_annealing.attrs["NX_class"] = "NXprocess"
|
||||
pre_ann_dict = layer_dict["pre_annealing"]
|
||||
nx_post_annealing = nx_layer.create_group("post_annealing")
|
||||
nx_post_annealing.attrs["NX_class"] = "NXprocess"
|
||||
post_ann_dict = layer_dict["post_annealing"]
|
||||
nx_layer_instruments = nx_layer.create_group("instruments_used")
|
||||
nx_layer_instruments.attrs["NX_class"] = "NXinstrument"
|
||||
layer_instruments_dict = layer_dict["instruments_used"]
|
||||
|
||||
## Target metadata
|
||||
try:
|
||||
nx_target.create_dataset("name", data=target_dict["name"])
|
||||
nx_target.create_dataset("chemical_formula", data=target_dict["chemical_formula"])
|
||||
nx_target.create_dataset("description", data=target_dict["description"])
|
||||
nx_target.create_dataset("shape", data=target_dict["shape"])
|
||||
nx_target.create_dataset("dimensions", data=target_dict["dimensions"])
|
||||
nx_target.create_dataset("thickness", data=target_dict["thickness"]["value"]) # float/int
|
||||
nx_target.create_dataset("name", data = target_dict["name"])
|
||||
nx_target.create_dataset("chemical_formula", data = target_dict["chemical_formula"])
|
||||
nx_target.create_dataset("description", data = target_dict["description"])
|
||||
nx_target.create_dataset("shape", data = target_dict["shape"])
|
||||
nx_target.create_dataset("dimensions", data = target_dict["dimensions"])
|
||||
nx_target.create_dataset("thickness", data = target_dict["thickness"]["value"]) # float/int
|
||||
nx_target["thickness"].attrs["units"] = target_dict["thickness"]["units"]
|
||||
nx_target.create_dataset("solid_form", data=target_dict["solid_form"])
|
||||
nx_target.create_dataset("manufacturer", data=target_dict["manufacturer"])
|
||||
nx_target.create_dataset("batch_id", data=target_dict["batch_id"])
|
||||
nx_target.create_dataset("solid_form", data = target_dict["solid_form"])
|
||||
nx_target.create_dataset("manufacturer", data = target_dict["manufacturer"])
|
||||
nx_target.create_dataset("batch_id", data = target_dict["batch_id"])
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
## Other layer-specific metadata
|
||||
try:
|
||||
nx_layer.create_dataset("start_time", data = layer_dict["start_time"])
|
||||
nx_layer.create_dataset("operator", data = layer_dict["operator"])
|
||||
@@ -346,20 +452,111 @@ def build_nexus_file(pld_fabrication, output_path):
|
||||
nx_layer["laser_energy"].attrs["units"] = layer_dict["laser_energy"]["units"]
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
## Rastering metadata
|
||||
try:
|
||||
nx_laser_rastering.create_dataset("geometry", data = rastering_dict["geometry"])
|
||||
nx_laser_rastering.create_dataset("positions", data = rastering_dict["positions"])
|
||||
nx_laser_rastering.create_dataset("velocities", data = rastering_dict["velocities"])
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
## Annealing metadata
|
||||
try:
|
||||
nx_pre_annealing.create_dataset("ambient_gas", data = pre_ann_dict["ambient_gas"])
|
||||
nx_pre_annealing.create_dataset("pressure", data = pre_ann_dict["pressure"]["value"])
|
||||
nx_pre_annealing["pressure"].attrs["units"] = pre_ann_dict["pressure"]["units"]
|
||||
nx_pre_annealing.create_dataset("temperature", data = pre_ann_dict["temperature"]["value"])
|
||||
nx_pre_annealing["temperature"].attrs["units"] = pre_ann_dict["temperature"]["units"]
|
||||
nx_pre_annealing.create_dataset("duration", data = pre_ann_dict["duration"]["value"])
|
||||
nx_pre_annealing["duration"].attrs["units"] = pre_ann_dict["duration"]["units"]
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
try:
|
||||
nx_post_annealing.create_dataset("ambient_gas", data = post_ann_dict["ambient_gas"])
|
||||
nx_post_annealing.create_dataset("pressure", data = post_ann_dict["pressure"]["value"])
|
||||
nx_post_annealing["pressure"].attrs["units"] = post_ann_dict["pressure"]["units"]
|
||||
nx_post_annealing.create_dataset("temperature", data = post_ann_dict["temperature"]["value"])
|
||||
nx_post_annealing["temperature"].attrs["units"] = post_ann_dict["temperature"]["units"]
|
||||
nx_post_annealing.create_dataset("duration", data = post_ann_dict["duration"]["value"])
|
||||
nx_post_annealing["duration"].attrs["units"] = post_ann_dict["duration"]["units"]
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
try:
|
||||
nx_layer_instruments.create_dataset("laser_system", data = layer_instruments_dict["laser_system"])
|
||||
nx_layer_instruments.create_dataset("deposition_chamber", data = layer_instruments_dict["deposition_chamber"])
|
||||
nx_layer_instruments.create_dataset("rheed_system", data = layer_instruments_dict["rheed_system"])
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
|
||||
# Instruments used section
|
||||
nx_instruments = nx_pld_entry.create_group("instruments_used")
|
||||
nx_instruments.attrs["NX_class"] = "NXinstrument"
|
||||
instruments_dict = pld_fabrication["instruments_used"]
|
||||
try:
|
||||
nx_instruments.create_dataset("laser_system", data = instruments_dict["laser_system"])
|
||||
nx_instruments.create_dataset("deposition_chamber", data = instruments_dict["deposition_chamber"])
|
||||
nx_instruments.create_dataset("rheed_system", data = instruments_dict["rheed_system"])
|
||||
except TypeError as te:
|
||||
raise TypeError(te)
|
||||
|
||||
# RHEED data section
|
||||
if rheed_osc is not None:
|
||||
nx_rheed = nx_pld_entry.create_group("rheed_data")
|
||||
nx_rheed.attrs["NX_class"] = "NXdata"
|
||||
|
||||
# Asse temporale
|
||||
t_ds = nx_rheed.create_dataset("time", data=rheed_osc["time"])
|
||||
t_ds.attrs["units"] = "s"
|
||||
t_ds.attrs["long_name"] = "Time"
|
||||
|
||||
# Intensità: shape (n_layers, n_timepoints, 3)
|
||||
i_ds = nx_rheed.create_dataset("intensity", data=rheed_osc["intensity"])
|
||||
i_ds.attrs["units"] = "a.u."
|
||||
i_ds.attrs["long_name"] = "RHEED Intensity"
|
||||
|
||||
# Attributi NXdata — notazione NeXus 3.x corretta
|
||||
nx_rheed.attrs["signal"] = "intensity"
|
||||
nx_rheed.attrs["axes"] = [".", "time", "."] # solo l'asse 1 (time) è denominato
|
||||
nx_rheed.attrs["time_indices"] = np.array([1], dtype=np.int32)
|
||||
# ###########
|
||||
# nx_rheed = nx_pld_entry.create_group("rheed_data")
|
||||
# nx_rheed.attrs["NX_class"] = "NXdata"
|
||||
|
||||
# nx_rheed.create_dataset("time", data=rheed_osc["time"])
|
||||
# nx_rheed["time"].attrs["units"] = "s"
|
||||
|
||||
# nx_rheed.create_dataset("intensity", data=rheed_osc["intensity"])
|
||||
# #nx_rheed["intensity"].attrs["units"] = "counts"
|
||||
# nx_rheed["intensity"].attrs["long_name"] = "RHEED intensity"
|
||||
# nx_rheed.attrs["signal"] = "intensity"
|
||||
# nx_rheed.attrs["axes"] = "layer:time:channel"
|
||||
# nx_rheed.attrs["layer_indices"] = [0] # asse layer
|
||||
# nx_rheed.attrs["time_indices"] = [1] # asse tempo
|
||||
# nx_rheed.attrs["channel_indices"] = [2]
|
||||
return
|
||||
|
||||
if __name__=="__main__":
|
||||
# TO-DO: place the API base URL somewhere else.
|
||||
ELABFTW_API_URL = "https://elabftw.fisica.unina.it/api/v2"
|
||||
apikey = getpass("Paste API key here: ")
|
||||
elabid = input("Enter elabid of your starting sample [default= 1111]: ") or 1111
|
||||
elabid = input("Enter elabid of your starting sample [default = 1111]: ") or 1111
|
||||
data = APIHandler(apikey).get_entry_from_elabid(elabid)
|
||||
sample = Entrypoint(data)
|
||||
sample_name = sample.name.strip().replace(" ","_")
|
||||
substrate_object = chain_entrypoint_to_batch(sample) # Substrate-class object
|
||||
layers = chain_entrypoint_to_layers(sample) # list of Layer-class objects
|
||||
n_layers = len(layers) # total number of layers on the sample
|
||||
result = make_nexus_schema_dictionary(substrate_object, layers)
|
||||
# print(make_nexus_schema_dictionary(substrate_object, layers)) # debug
|
||||
with open (f"output/sample-{sample_name}.json", "w") as f:
|
||||
json.dump(result, f, indent=3)
|
||||
build_nexus_file(result, output_path=f"output/sample-{sample_name}-nexus.h5")
|
||||
# TO-DO: remove the hard-coded path of the RWA file
|
||||
# ideally the script should download a TXT/CSV file from each layer
|
||||
# (IF PRESENT ←→ also handle missing file error)
|
||||
# and merge all data in a single file to analyse it
|
||||
with open(f"tests/Realtime_Window_Analysis.txt", "r") as o:
|
||||
osc = np.loadtxt(o, delimiter="\t")
|
||||
try:
|
||||
rheed_osc = analyse_rheed_data(data=osc) or None # analyze rheed data first, build the file later
|
||||
except ValueError as ve:
|
||||
raise ValueError(f"Error with function analyse_rheed_data. {ve}\nPlease make sure the Realtime Window Analysis file is exactly 4 columns wide - where the first column represents time and the others are RHEED intensities.")
|
||||
build_nexus_file(result, output_path=f"output/sample-{sample_name}-nexus.h5", rheed_osc=rheed_osc)
|
||||
|
||||
37931
tests/Realtime_Window_Analysis.txt
Normal file
37931
tests/Realtime_Window_Analysis.txt
Normal file
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user