Import libraries¶
import sigma
from sigma.utils import normalisation as norm
from sigma.utils import visualisation as visual
from sigma.utils.load import SEMDataset
from sigma.src.utils import same_seeds
from sigma.src.dim_reduction import Experiment
from sigma.models.autoencoder import AutoEncoder
from sigma.src.segmentation import PixelSegmenter
from sigma.gui import gui
Load files¶
Load the .bcf file and create a SEMDataset object (which uses hyperspy as the backend).
file_path = 'test.bcf'
sem = SEMDataset(file_path)
1. Dataset preprocessing¶
1.1 View the dataset¶
Use gui.view_dataset(sem) to check the BSE image, the sum spectrum, and the elemental maps. The default feature list (i.e. the elemental peaks) is extracted from the metadata of the .bcf file. The peaks can be modified manually in Feature list; clicking set applies the new feature list and generates the corresponding elemental intensity maps. In this way, the raw hyperspectral imaging (HSI) dataset becomes a set of elemental maps with dimensions of 279 x 514 x 9 (for the test file).
How can users determine the elements for analysis?
Users can use the interactive widget in the "EDX sum spectrum" tab to check the energy peaks and determine the Feature list for further analyses.
gui.view_dataset(dataset=sem)
In addition to the GUI, we can view the dataset directly with the sem object (see the example after this list):
sem.nav_img: access the back-scattered electron (BSE) image (as a hyperspy Signal2D object).
sem.spectra: access the EDX dataset (as a hyperspy EDSSEMSpectrum object).
visual.plot_sum_spectrum(sem.spectra): view the sum spectrum (or use the hyperspy built-in sem.spectra.sum().plot(xray_lines=True)).
sem.feature_list: view the default elemental peaks chosen for the EDX dataset.
sem.set_feature_list: set new elemental peaks.
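For example, the following cell uses these accessors to inspect the dataset without the GUI (a minimal sketch built only from the calls listed above):
# Quick look at the dataset without the GUI
print(sem.feature_list)                  # default elemental peaks from the .bcf metadata
sem.nav_img.plot()                       # BSE image (hyperspy Signal2D)
visual.plot_sum_spectrum(sem.spectra)    # sum spectrum of the EDX dataset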
1.2 Process the dataset¶
Several (optional) functions to process the dataset:¶
sem.rebin_signal(size=(2,2)): rebin the EDX signal with a binning size of 2x2. After rebinning, the binned EDX or BSE data can be accessed with sem.edx_bin or sem.bse_bin.
Note: The binning size may be adjusted depending on the number of pixels and the signal-to-noise ratio of the EDS spectra. If the input HSI-EDS data contains too many pixels, it may exhaust the RAM. As for the signal-to-noise ratio, the counts per pixel should ideally be higher than 100. For the test dataset, the average counts per pixel is 29.94 before binning and 119.76 after binning (a quick way to check this is sketched after this list).
sem.peak_intensity_normalisation(): normalise the x-ray intensity along the energy axis.
sem.remove_fist_peak(end=0.1): remove the first x-ray peak (most likely noise) up to the energy given by end. For example, to remove the intensity values from 0-0.1 keV, set end=0.1. This is an optional step.
visual.plot_intensity_maps: plot the elemental intensity maps.
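As a quick sanity check before choosing a binning size, the average counts per pixel can be estimated directly from the raw spectra. A minimal sketch, assuming the spectra are exposed as a (height, width, channels) numpy array via hyperspy's .data attribute:
import numpy as np

# Estimate the average x-ray counts per pixel
counts = np.asarray(sem.spectra.data, dtype=float)
avg_counts = counts.sum() / (counts.shape[0] * counts.shape[1])
print(f'Average counts per pixel: {avg_counts:.2f}')   # ~29.94 for the test file before binning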
# Rebin both edx and bse dataset
sem.rebin_signal(size=(2,2))
# Remove the first peak until the energy of 0.1 keV
sem.remove_fist_peak(end=0.1)
# Normalise so that the spectrum of each pixel sums to 1
sem.peak_intensity_normalisation()
# View the dataset (bse, edx etc.) again to check differences.
# Note that a new tab (including the binned elemental maps) will show up only if the user has run sem.rebin_signal.
gui.view_dataset(dataset=sem)
The pre-processing steps yield an HSI datacube with dimensions of 139 x 257 x 9 (due to the 2x2 binning).
1.3 Normalisation¶
Before dimensionality reduction, we normalise the elemental maps using sem.normalisation(), to which we can pass a list of (optional) sequential normalisation steps.
Note that the pre-processing steps are all optional, but if the user opts for the softmax option, the z-score step should be applied beforehand, i.e. the softmax normalisation procedure requires input data that is z-score normalised. The purpose of the combined normalisation step (z-score + softmax) is to provide the autoencoder with an input that includes global information from all pixels and an 'intentional bias' within a single pixel.
neighbour_averaging: equivalent to applying a 3x3 mean filter to the HSI-EDS data. This is an optional step.
zscore: rescales the intensity values within each elemental map such that, for each map, the mean of all values is 0 and the standard deviation is 1. For example, after z-score normalisation, the Fe Ka map should contain pixels with intensity values that yield mean=0 and std=1.
softmax: applied within each individual pixel, across the z-scores of the different elemental peaks. For example, if 5 elemental maps are specified, the 5 corresponding z-scores of each individual pixel are used to calculate the softmax outputs (see the sketch after this list).
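To make these steps concrete, here is a minimal numpy/scipy sketch of what the three normalisation steps compute, using a random array as a stand-in for the binned elemental maps (the shapes are illustrative):
import numpy as np
from scipy.ndimage import uniform_filter

rng = np.random.default_rng(0)
maps = rng.random((139, 257, 9))               # stand-in for the binned elemental maps

# neighbour_averaging: a 3x3 mean filter applied to each elemental map
avg = uniform_filter(maps, size=(3, 3, 1))

# zscore: rescale each elemental map to mean 0 and standard deviation 1
z = (avg - avg.mean(axis=(0, 1))) / avg.std(axis=(0, 1))

# softmax: applied across the 9 z-scores within each individual pixel
e = np.exp(z - z.max(axis=2, keepdims=True))   # subtract the max for numerical stability
s = e / e.sum(axis=2, keepdims=True)

print(np.allclose(s.sum(axis=2), 1.0))         # True: each pixel now sums to 1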
# Normalise the dataset using the three (optional) sequential methods
sem.normalisation([norm.neighbour_averaging,
norm.zscore,
norm.softmax])
Use gui.view_pixel_distributions to view the intensity distributions after each sequential normalisation step.
gui.view_pixel_distributions(dataset=sem,
norm_list=[norm.neighbour_averaging,
norm.zscore,
norm.softmax],
cmap='inferno')
1.4 (Optional) Assign RGB to elemental peaks¶
gui.view_rgb(dataset=sem)
1.5 Check elemental distribution after normalisation¶
print('After normalisation:')
gui.view_intensity_maps(spectra=sem.normalised_elemental_data, element_list=sem.feature_list)
2. Dimensionality reduction¶
2.1 Method 1: Autoencoder¶
2.1.1 Initialise experiment / model¶
Parameters for Experiment
descriptor: str. The name of the model; it will be used as the model name when saving the model.
general_results_dir: path. The folder path for saving the model (the model will be saved automatically in the specified folder).
model: AutoEncoder. The model to be used for training. At the moment, only the vanilla autoencoder is available; more models (e.g. a variational autoencoder) will be implemented in future versions.
model_args: dict. Keyword arguments for the AutoEncoder architecture. The most essential argument is 'hidden_layer_sizes', which specifies the number of hidden layers and their corresponding neurons. For example, with (512,256,128) the encoder will consist of three layers (the first layer with 512 neurons, the second with 256, and the third with 128), and the decoder will mirror it with three layers (128, 256, and 512 neurons). The default setting is recommended for general cases. Increasing the number of layers and neurons increases the complexity of the model, which raises the risk of overfitting. (An illustrative sketch of this mirrored structure follows this list.)
chosen_dataset: np.ndarray. Normalised HSI-EDS data. The size should be (width, height, number of elemental maps).
save_model_every_epoch: bool. If True, the autoencoder model will be saved every epoch. If False, the model will be saved only when the loss value is lower than the previously recorded minimum.
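For intuition, here is an illustrative PyTorch sketch of the mirrored encoder/decoder structure that hidden_layer_sizes=(512,256,128) describes. It is not SIGMA's exact AutoEncoder implementation; the layer choices and the 2D latent size (matching the (n, 2) latent used later) are assumptions for illustration.
import torch.nn as nn

# Illustrative mirror-image MLP; n_features is the number of elemental maps (9 for the test file)
n_features = 9
encoder = nn.Sequential(
    nn.Linear(n_features, 512), nn.ReLU(),
    nn.Linear(512, 256), nn.ReLU(),
    nn.Linear(256, 128), nn.ReLU(),
    nn.Linear(128, 2),                 # 2D latent space used for segmentation later
)
decoder = nn.Sequential(
    nn.Linear(2, 128), nn.ReLU(),
    nn.Linear(128, 256), nn.ReLU(),
    nn.Linear(256, 512), nn.ReLU(),
    nn.Linear(512, n_features),
)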
# The integer passed to this function determines the initialised parameters of the model (it fixes the pseudo-randomness).
# This can influence the result of the dimensionality reduction and change the latent space.
same_seeds(1)
# Set the folder path for saving the model (the model will be saved automatically in the specified folder)
result_folder_path='./'
# Set up the experiment, e.g. determining the model structure, dataset for training etc.
ex = Experiment(descriptor='softmax',
general_results_dir=result_folder_path,
model=AutoEncoder,
model_args={'hidden_layer_sizes':(512,256,128)},
chosen_dataset=sem.normalised_elemental_data,
save_model_every_epoch=False)
2.1.2 Training¶
Parameters for ex.run_model
num_epochs: int. The number of complete passes through the training dataset. 50-100 is recommended. A rule of thumb: if the loss value stops decreasing, that epoch may be a good point to stop.
batch_size: int. The number of data points per gradient update. Values between 32-128 are recommended. A smaller batch size means more updates within an epoch, but makes the optimisation process more stochastic.
learning_rate: float in the range 0-1. The learning rate controls how quickly the model adapts to the problem. 1e-4 is recommended. A higher learning rate may yield faster convergence but risks getting stuck in an undesirable local minimum.
task: str. If 'train_all', all data points are used for training the autoencoder. If 'train_eval', training is conducted on a training set (85% of the dataset) and evaluation on a test set (the remaining 15%). The recommended procedure is to run 'train_eval' for hyperparameter selection and 'train_all' for the final analysis.
criterion: str. If 'MSE', the criterion measures the mean squared error (squared L2 norm) between each element of the input x and the target y. 'MSE' is currently the only option; other criteria will be implemented in future versions.
# Train the model
ex.run_model(num_epochs=20,
batch_size=32,
learning_rate=1e-4,
weight_decay=0.0,
task='train_all',
criterion='MSE'
)
latent = ex.get_latent()
(Optional) Load pre-trained Autoencoder¶
# model_path = './' # path to the saved model (the model file is stored in the folder 'result_folder_path')
# ex.load_trained_model(model_path)
3. Pixel segmentation¶
3.1 Method 1: Gaussian mixture modelling (GMM) clustering¶
3.1.1 Measure Bayesian information criterion (BIC)¶
gui.view_bic iteratively calculates the BIC for Gaussian mixture models with an increasing number of Gaussian components.
Parameters for gui.view_bic
latent: np.ndarray. The 2D representations learned by the autoencoder. The size of the input array must be (n, 2), where n is the total number of data points.
model: str. The model used to calculate the BIC. Only 'GaussianMixture' is available for now.
n_components: int. If n_components=20, the BIC values are shown for GMMs with n_components from 1 to 20.
model_args: dict. Keyword arguments for the GMM model in sklearn. For example, random_state specifies the random seed for optimisation (this makes the results reproducible), and init_params specifies the parameter initialisation of the GMM model ('kmeans' is recommended). See more details here.
gui.view_bic(latent=latent,
model='GaussianMixture',
n_components=14,
model_args={'random_state':6, 'init_params':'kmeans'})
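For reference, the BIC scan is conceptually equivalent to fitting a scikit-learn GaussianMixture for each number of components and recording the BIC. This is a sketch of the idea, not the exact implementation of gui.view_bic:
import numpy as np
from sklearn.mixture import GaussianMixture

# Fit a GMM for n = 1..14 components and record the BIC for each
bics = [GaussianMixture(n_components=n, random_state=6,
                        init_params='kmeans').fit(latent).bic(latent)
        for n in range(1, 15)]
print(f'BIC is minimised at {np.argmin(bics) + 1} components')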
3.1.2 Run GMM¶
Parameters for PixelSegmenter
latent: np.ndarray. The size of the input array must be (n, 2), where n is the total number of data points.
dataset_norm: np.ndarray. Normalised HSI-EDS data. The size should be (width, height, number of elemental maps).
sem: SEMDataset. The SEM object created at the beginning.
method: str. Model for clustering.
method_args: dict. Keyword arguments for the GMM model in sklearn. See more details here.
ps = PixelSegmenter(latent=latent,
dataset=sem,
method="GaussianMixture",
method_args={'n_components':14, 'random_state':6, 'init_params':'kmeans'} )
# Change random_state to a different integer (e.g. 10 or 0) to adjust the clustering result.
3.3 Visualisation¶
3.3.1 Checking latent space¶
Parameters for gui.view_latent_space
ps: PixelSegmenter. The PixelSegmenter object that was just created.
color: bool. If True, the latent space will be colour-coded according to the cluster labels.
# Plot the latent space (2-dimensional) with the corresponding Gaussian models
gui.view_latent_space(ps=ps, color=True)
Parameters for gui.check_latent_space
ps: PixelSegmenter. The PixelSegmenter object that was just created.
ratio_to_be_shown: float. The value must be between 0-1. For example, if 0.5, only 50% of the data points will be shown in the latent space.
show_map: bool. If True, the corresponding locations of the data points will be overlaid on the BSE image.
# visualise the latent space
gui.check_latent_space(ps=ps, ratio_to_be_shown=1.0, show_map=True)
Parameters for gui.plot_latent_density
ps: PixelSegmenter. The PixelSegmenter object that was just created.
bins: int. The number of bins for the given interval of the latent space.
# check the density of latent space
gui.plot_latent_density(ps=ps, bins=50)
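The same density view can be reproduced directly with matplotlib, which makes the role of bins explicit (an illustrative sketch, not the gui implementation):
import matplotlib.pyplot as plt

# 2D histogram of the latent space; `bins` sets how finely the space is partitioned
plt.hist2d(latent[:, 0], latent[:, 1], bins=50)
plt.colorbar(label='counts per bin')
plt.xlabel('latent dimension 1')
plt.ylabel('latent dimension 2')
plt.show()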
3.3.2 Checking each cluster¶
# ps.set_feature_list(['Al_Ka', 'C_Ka', 'Ca_Ka', 'Fe_Ka', 'K_Ka', 'O_Ka', 'Si_Ka', 'Ti_Ka', 'Zn_La'])
gui.show_cluster_distribution(ps=ps)
3.3.3 Checking cluster map¶
# Plot phase map using the corresponding GM model
gui.view_phase_map(ps=ps, alpha_cluster_map=0.5)
Parameters for gui.view_clusters_sum_spectra
ps: PixelSegmenter. The PixelSegmenter object that was just created.
normalisation: bool. If True, the sum spectra will be normalised.
spectra_range: tuple. Sets the limits of the energy axis (in keV).
gui.view_clusters_sum_spectra(ps=ps, normalisation=True, spectra_range=(0,8))
4. Unmixing cluster spectra using Non-negative Matrix Factorization (NMF)¶
Parameters for ps.get_unmixed_spectra_profile
clusters_to_be_calculated: str or list. If 'All', all cluster-spectra will be included in the data matrix for NMF. If it is a list of integers (e.g. [0,1,2,3]), only the #0, #1, #2, and #3 cluster-spectra will be used as the data matrix for NMF.
normalised: bool. If True, the sum spectra will be normalised before NMF unmixing.
method: str. Model to be used.
method_args: dict. Keyword arguments for the NMF method (or others). See more details here.
weights, components = ps.get_unmixed_spectra_profile(clusters_to_be_calculated='All',
n_components='All',
normalised=False,
method='NMF',
method_args={'init':'nndsvd'})
gui.show_unmixed_weights_and_compoments(ps=ps, weights=weights, components=components)
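Conceptually, the unmixing step factorises the non-negative matrix of cluster sum spectra into weights and spectral components, much like scikit-learn's NMF. The sketch below uses a random stand-in matrix and an illustrative n_components; it is not the library's exact implementation:
import numpy as np
from sklearn.decomposition import NMF

rng = np.random.default_rng(0)
X = rng.random((14, 2048))    # stand-in for 14 cluster sum spectra x 2048 energy channels

nmf = NMF(n_components=4, init='nndsvd')   # 'nndsvd' matches the method_args above
weights = nmf.fit_transform(X)             # contribution of each component to each cluster
components = nmf.components_               # unmixed spectral profiles
print(weights.shape, components.shape)     # (14, 4) and (4, 2048)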
Check abundance map for components (using RGB maps)¶
gui.show_abundance_map(ps=ps, weights=weights, components=components)
Statistics info from clusters¶
gui.show_cluster_stats(ps=ps)