% best_estimates.m

% Create TAB files containing the current best estimates of plasma parameters.
% 
%
% NOTES
% =====
% NOTE: Presently only based on probe 1 sweeps, one estimate per (probe 1) sweep.
%
% IMPORTANT NOTE: Uses the non-PDS compliant first row
% of column headers in AxS to label variables (struct fields).
% When/if that becomes PDS compliant, this code WILL NOT WORK!
%    
% IMPORTANT NOTE: Uses file existence to check for existence of pre-sweep low-freq. bias potential.
%
% IMPORTANT NOTE: This function may have a memory problem for large files or large datasets.
%    It may therefore contain extra code for logging memory use. Only a limited effort to reduce
%    memory usage has been made so far.
%
% NOTE: Uses the global variable MISSING_CONSTANT.
%
function an_tabindex = best_estimates(an_tabindex, tabindex, index, obe)
% Public entry point: thin wrapper around main_INTERNAL.
%
% Temporarily enables all warnings, calls main_INTERNAL, prints the elapsed wall time
% and always restores the caller's warning configuration afterwards.
%
% Errors are NOT propagated to the caller: any error is caught and its message and
% call stack are printed to stdout. In that case "an_tabindex" is returned exactly as
% it was passed in (the assignment from main_INTERNAL never takes place).
%
% ARGUMENTS
% =========
% an_tabindex : Cell array, one row per analysis file. Amended and returned.
% tabindex    : Cell array; forwarded to main_INTERNAL.
% index       : Struct array; forwarded to main_INTERNAL.
% obe         : Numeric array with one element per operations block; forwarded to main_INTERNAL.
%
% RETURN VALUE
% ============
% an_tabindex : Input "an_tabindex", with one extra row per EST file written.

%===========================================================================================
% NOTE: In principle: Not one EST file per A1S/A2S file, but
% per operations block (both probes together). 
%
% NOTE: importdata omits columns without numbers.
% ==> Matrices of numbers (not strings) from some AxS files have
% fewer columns ==> Nbr of column names and nbr of columns don't match.
%
% FOOTNOTE: Have not found any hard source code which specifies the
% exact length of UTC-time strings. ==> One has to "measure" the
% length manually for now.
% Ex: "2014-08-31T22:14:24.369327" ==> 10 + 1 + 8 + 1 + 6 = 26 bytes
%
% TODO: Better way to connect an_tabindex nbr-of-columns to file-writing code.
%
% TODO: Not rely on non-PDS compliant AxS first-line column headers.
%    PROPOSAL: Use general ODL/LBL reading code?
%       CON: Can not presently (2014-11-25) make use of the corresponding LBL file
%            for finding column names since the LBL file has not yet been created at
%            this stage in the execution of lapdog.
%
% PROPOSAL: Change to model with all sweep analysis data in one table (add probe number field to distinguish probes)
% PROPOSAL: Change to using cell arrays instead of structs with array fields.
%     data.data, data.col_names
%     PROPOSAL: Separate cell arrays for strings and numeric values.
%         PRO: Can easily search/select sweeps depending on parameters (time, direction, probe). 
%
% PROPOSAL: Remove Vsc values equal or lower/higher than lowest/highest sweep bias.
%   NOTE: Sweep bias values can be read from B?S.TAB files.
%
% PROPOSAL: Convert "an_tabindex", "tabindex" to structs.
%   NOTE: "index" already is a struct.
%   NOTE: "an_tabindex" is returned to the caller. "Must" be able to convert back.
%   PROPOSAL: Reuse code for conversion of "an_tabindex" and "tabindex".
%
% TODO: Check whether to expect low-freq bias potential using macro, instead of checking file existence?
% TODO: Remove references to "et" times. Use OBT.
%
% NOTE/BUG: It is perfectly possible for there to legitimately be no IxL/IxH file for short time
% intervals within a UTC day, e.g. a macro that starts just before midnight.
% ==> There might not have been any IxL/H measurements at all.
% ==> Absence of IxL/H TAB file is not an indication of error.
% The current implementation of the code does not appear to take this possibility into account
% and gives an error when there should be none.
% NOTE/BUG: !!! Tentatively, it appears that tabindex may contain references to IxLH files that do not exist. If that is fixed,
% the bug is fixed.
% Example: 2015/MAY/D01/RPCLAP_20150501_235959_807*
%    PROPOSAL: try-catch for every particular EST file, not for all EST files together.
%    PROPOSAL: try-catch for reading IxL/H files and permit absence of file.
%-------------------------------------------------------------------------------------------
% MEMORY PROBLEM:
% ---------------
% PROPOSAL: Eliminate main_INTERNAL function to eliminate temporary variables (in particular "index" is sizable).
%    CON: "Ugly" having try-catch covering all code.
% PROPOSAL: Do not build up PO_table.
%===========================================================================================

    global MISSING_CONSTANT

    % Save the caller's warning configuration BEFORE entering try-catch, so that it can be
    % restored on both the success path and the error path.
    warnings_settings = warning('query');

    try
        warning('on', 'all')
        
        MEMORY_USE_LOG_ENABLED = 0;  % Enable/disable memory usage log output. Printouts should be removed permanently some day.
        t_start = clock;             % NOTE: Not number of seconds, but [year month day hour minute seconds].
    
        an_tabindex = main_INTERNAL(an_tabindex, tabindex, index, obe, MISSING_CONSTANT, MEMORY_USE_LOG_ENABLED);
    
        fprintf(1, '%s: %0.f s (elapsed wall time)\n', mfilename, etime(clock, t_start));
    catch err
        % Deliberate best-effort: report the error and the call stack, but do not rethrow.
        fprintf(1,'\nlapdog:best_estimates error message: %s\n',err.message);
        
        for i = 1:length(err.stack)
            fprintf(1,'%s, %i,\n', err.stack(i).name, err.stack(i).line);
        end
    end
    
    % Restore the warning configuration regardless of whether an error occurred.
    warning(warnings_settings)
    
end


% #############################################################################################


% UNFINISHED
function an_tabindex = main_INTERNAL(an_tabindex, tabindex, index, obe, MISSING_CONSTANT, memory_use_log_enabled)
    % Write one EST (best estimates) TAB file per operations block that contains sweeps,
    % and append one row per written EST file to "an_tabindex".
    %
    % ARGUMENTS
    % =========
    % an_tabindex : Cell array, one row per analysis file. Columns as read/written by this function:
    %               1 = file path, 2 = file name, 3 = index into "index", 4 = number of rows,
    %               5 = number of columns, 6 = index into "tabindex", 7 = file type string
    %               ('sweep' rows are read, 'best_estimates' rows are added),
    %               8 = timing cell array (4 components; components 3 and 4 are passed to str2num), 9 = bytes per row.
    % tabindex    : Cell array. Only column 1 (file paths) is used, to check whether IxL/IxH files are listed.
    % index       : Struct array. Only the field "probe" is used.
    % obe         : Numeric array, one element per operations block. An "index" value i belongs to the
    %               first block k for which obe(k) >= i (presumably obe holds the last index of every
    %               ops block - TODO confirm against caller).
    % MISSING_CONSTANT       : Value written to the EST file in place of NaN.
    % memory_use_log_enabled : True/non-zero ==> Print "whos" memory diagnostics.
    %
    % NOTE: Errors are not handled here; they propagate to the caller.
    
    nob = length(obe);
    
    if isempty(an_tabindex)
        warning('"an_tabindex" is empty.')
    end
    
    
    %------------------------------------------------------------------------------------------
    % Create table of data from resp. probes. Table has indices (<ops block>, <probe number>).
    %
    % NOTE: Not all entries will necessarily be assigned.
    % Some ops blocks may not contain sweeps, some may sweep on only one probe, or none.
    % NOTE: ant = "an_tabindex"
    %------------------------------------------------------------------------------------------
    i_ant_list = find(strcmp(an_tabindex(:,7), 'sweep'));   % ant = "an_tabindex"
    PO_table = cell(nob, 2);               % PO = probe-operations block. Data for one probe during one ops block.
    O_list   = cell(nob, 1);               % O  = operations block. Data for one operations block (in practice EST, if contains sweeps).
    for i_ant = i_ant_list(:)'      % for every 'sweep' file ...   (List of values must be row vector for iteration to work.)
        PO = [];
        PO.i_ant = i_ant;
        
        % Find i_ob and i_probe.
        i_ind   = an_tabindex{i_ant, 3};                % ind = "index" (the index of CALIB files)
        i_ob    = find(obe >= i_ind, 1);                % ob = Operations block.
        i_probe = index(i_ind).probe;
        
        % Determine AxS, EST, IxL, IxH, BxS filenames & paths.
        % NOTE: Ugly. Derives the other names from the AxS name by overwriting the three characters
        % immediately before the four last characters (presumably a file suffix like ".TAB").
        AxS_file_path = an_tabindex{i_ant, 1};
        AxS_file_name = an_tabindex{i_ant, 2};
        EST_file_path              = AxS_file_path;
        EST_file_path(end-6:end-4) = 'EST';
        EST_file_name              = AxS_file_name;
        EST_file_name(end-6:end-4) = 'EST';
        IxL_file_path              = AxS_file_path;
        IxL_file_path(end-6:end-4) = sprintf('I%iL', i_probe);
        IxH_file_path              = AxS_file_path;
        IxH_file_path(end-6:end-4) = sprintf('I%iH', i_probe);
        BxS_file_path              = AxS_file_path;
        BxS_file_path(end-6:end-4) = sprintf('B%iS', i_probe);
        
        [PO.data, N_sw] = read_AxS_file_INTERNAL(AxS_file_path, i_probe);
        
        %-----------------------------------------------------------------------------------------------------------
        % Add most recent low frequency bias potential before every individual sweep
        % --------------------------------------------------------------------------
        % (Might not be relevant if sweep is preceded by other sweep but that is not decided here in the code.)
        % NOTE: Special case: First sweep might not have a preceding low freq. bias potential in the same ops block.
        % NOTE: Special case: It takes time to change/set bias and the immediately following value(s) may be faulty.
        %
        % IMPORTANT NOTE: Code uses tabindex to check for existence of pre-sweep LF/HF data. TODO: Change?
        %-----------------------------------------------------------------------------------------------------------
        IxLH_data = [];
        if     any(strcmp({tabindex{:,1}}, IxL_file_path))
            IxLH_data = read_IxLH_file_bias_voltage_INTERNAL(IxL_file_path, i_probe, memory_use_log_enabled);
        elseif any(strcmp({tabindex{:,1}}, IxH_file_path))
            IxLH_data = read_IxLH_file_bias_voltage_INTERNAL(IxH_file_path, i_probe, memory_use_log_enabled);
        end
        
        % Always create the field with its final size (NaN = no preceding bias value known).
        % This guarantees that the field exists also when N_sw == 0, so that the set of fields
        % is the same for all probes, irrespective of whether IxL/IxH data was found.
        PO.data.V_LF_HF_before_sweep = NaN(N_sw, 1);
        if ~isempty(IxLH_data)
            for i_sw = 1:N_sw
                % Last IxL/IxH sample strictly before the start of the sweep.
                i_IxLH = find(IxLH_data.TIME_OBT < PO.data.START_TIME_OBT(i_sw), 1, 'last');    % Intermediate value, for clarity and debugging.
                if ~isempty(i_IxLH)
                    PO.data.V_LF_HF_before_sweep(i_sw) = IxLH_data.V_bias(i_IxLH);
                end
            end
        end
        
        % Read lowest/highest V_bias for sweeps.
        [PO.V_bias_min, PO.V_bias_max] = read_BxS_min_max_bias_voltage_INTERNAL(BxS_file_path);
        
        % NOTE: May overwrite the component with the same EST path (but that is not a problem).
        O_list{i_ob}.EST_file_path = EST_file_path;
        O_list{i_ob}.EST_file_name = EST_file_name;
        
        PO_table{i_ob, i_probe} = PO;
        clear PO
        if memory_use_log_enabled
            fprintf(1, 'main_INTERNAL: End of iteration in first loop - call "whos PO_table"\n')
            whos PO_table   % DEBUG
        end
    end
    if memory_use_log_enabled
        fprintf(1, 'main_INTERNAL: After first loop - call "whos PO_table index"\n')
        whos PO_table index% DEBUG
    end
    
    
    %---------------------------------------------------------------------
    % Iterate over operations blocks and ignore those without sweep data,
    % i.e. iterate over EST files.
    %---------------------------------------------------------------------
    for i_ob = 1:nob    % for every ops block ...
        
        if isempty(PO_table{i_ob, 1}) && isempty(PO_table{i_ob, 2})
            continue
        end
        
        
        %--------------------------------------------------------
        % Compile all sweeps into one table.
        % ----------------------------------
        % IMPLEMENTATION NOTE: Can NOT merge this code into one
        % merge_structs_arrays_INTERNAL({PO1.data, PO2.data})
        % command since it is uncertain whether the PO entries themselves
        % are empty, not whether their .data fields are empty.
        %--------------------------------------------------------
        sweep_data = [];
        V_bias_limits = {[], []};
        for i_P = 1:2     % For every probe ...
            PO = PO_table{i_ob, i_P};
            
            if ~isempty(PO)
                sweep_data = merge_structs_arrays_INTERNAL({sweep_data, PO.data});
                V_bias_limits{i_P} = struct('V_bias_min', PO.V_bias_min, 'V_bias_max', PO.V_bias_max);
            end
        end
        
        
        %--------------------------------
        % Derive best estimates ("est").
        %--------------------------------
        sim_sweep_data_grps_list = group_simultaneous_sweeps_INTERNAL(sweep_data);
        N_grps = length(sim_sweep_data_grps_list);
        if (N_grps == 0)
            %--------------------------------------------------------------------------------------
            % In case there are not enough sweeps for a single group of sweeps, do not even try to
            % create an EST file. The below code would break anyway as "est_sweep_data" will
            % contain no fields.
            % BUG/TODO?: This could also be seen as a bug. Modify
            % group_simultaneous_sweeps_INTERNAL to produce one last
            % "incomplete" group of sweeps?
            % NOTE: If no EST file is produced, then there should also be no corresponding LBL file.
            % --------------------------------------------------------------------------------------
            % I think the data archiving policy is that when there is no data,
            % there should also be no file. (Source?) /Erik P G Johansson 2015-01-08.
            %---------------------------------------------------------------------------------------
            fprintf(1, 'best_estimates: Too few sweeps in ops block for best estimates (not error).\n')
            fprintf(1, '==> Skipping: %s\n', O_list{i_ob}.EST_file_path)
            continue
        end
        
        est_sweep_data_grps_list = cell(N_grps, 1);
        for i_grp = 1:N_grps       % NOTE: i_grp != est_sweep_data_grps_list{i_grp}.sweep_group_nbr
            est_sweep_data_grps_list{i_grp} = select_best_estimates_INTERNAL(sim_sweep_data_grps_list{i_grp}, V_bias_limits);
        end
        est_sweep_data = merge_structs_arrays_INTERNAL(est_sweep_data_grps_list);
        
        
        [row_bytes, N_columns, N_rows] = write_EST_file_INTERNAL(O_list{i_ob}.EST_file_path, est_sweep_data, MISSING_CONSTANT);
        
        
        %------------------------------------------------------
        % Update an_tabindex.
        % -------------------
        % Time start/stop is the only one that is non-trivial:
        % use components 1 & 3 from the probe file with the earliest start (component 3) and
        % components 2 & 4 from the probe file with the latest stop (component 4).
        % Two values can not be set to anything (?).
        %------------------------------------------------------
        timing_start_list = [];
        timing_stop_list  = [];
        timing_list       = {};
        i_index           = [];
        for i_P = 1:2
            P = PO_table{i_ob, i_P};
            if ~isempty(P)
                timing_start_list(end+1) = str2num(an_tabindex{P.i_ant, 8}{3});
                timing_stop_list(end+1)  = str2num(an_tabindex{P.i_ant, 8}{4});
                timing_list(end+1)       = an_tabindex(P.i_ant, 8);
                i_index(end+1)           = an_tabindex{P.i_ant, 3};
            end
        end
        [junk, i_start] = min(timing_start_list);
        [junk, i_stop]  = max(timing_stop_list);
        an_tabindex_timing = { ...
            timing_list{i_start}{1}, ...
            timing_list{i_stop }{2}, ...
            timing_list{i_start}{3}, ...
            timing_list{i_stop }{4} ...
            };
        an_tabindex_amendment = cell(1, 9);
        an_tabindex_amendment{1, 1} = O_list{i_ob}.EST_file_path;    % File path
        an_tabindex_amendment{1, 2} = O_list{i_ob}.EST_file_name;    % Filename
        an_tabindex_amendment{1, 3} = i_index;      % Index back to corresponding "index" file. ARRAY. Otherwise not meaningful?!!
        an_tabindex_amendment{1, 4} = N_rows;
        an_tabindex_amendment{1, 5} = N_columns;
        an_tabindex_amendment{1, 6} = [];               % Index back to corresponding "tabindex" file. - CAN NOT BE MEANINGFULLY SET?!!
        an_tabindex_amendment{1, 7} = 'best_estimates';
        an_tabindex_amendment{1, 8} = an_tabindex_timing;
        an_tabindex_amendment{1, 9} = row_bytes;
        an_tabindex(end+1, :) = an_tabindex_amendment;
    end
    
end


% #############################################################################################


%------------------------------------------------------------------------------------------------
% Given a set of sweeps, return groups of approximately simultaneous sweeps for
% "select_best_estimates_INTERNAL" to work on (one group at a time).
%
% NOTE: The grouped sweeps should preferably/probably not overlap,
% and preferably/probably together represent all sweeps.
% This depends on the exact implementation of "select_best_estimates_INTERNAL".
%
% sim = simultaneous; sw = sweep
%
% ARGUMENTS
% =========
% sw_data : 1x1 struct with fields which are same-sized 1D arrays.
%------------------------------------------------------------------------------------------------
function [sim_sweep_data_grps_list] = group_simultaneous_sweeps_INTERNAL(sw_data)
    % Partition sweeps into groups of approximately simultaneous sweeps.
    %
    % The sweeps are first sorted by MIDDLE_TIME_OBT and then traversed once. A group is
    % complete when every probe (1 and 2) that has any sweeps at all has contributed
    % - one sweep pair, if that probe has at least one sweep pair anywhere in sw_data, or
    % - one single sweep otherwise.
    % Two consecutive sweeps on the same probe count as a pair iff the STOP_TIME_OBT of the first
    % is exactly equal to the START_TIME_OBT of the second.
    % On a probe that has pairs, sweeps that are not part of a pair are skipped.
    % A trailing group which is still incomplete when the sweeps run out is discarded.
    %
    % ARGUMENTS
    % =========
    % sw_data : 1x1 struct with fields which are same-sized 1D arrays. Fields used here:
    %           MIDDLE_TIME_OBT, START_TIME_OBT, STOP_TIME_OBT, probe_nbr.
    %
    % RETURN VALUE
    % ============
    % sim_sweep_data_grps_list : Cell array (possibly empty), one struct per group, in time order.
    %           Every struct is the selection of sw_data for the group's sweeps, with added fields
    %           pair_first      : Non-zero iff the sweep is the first sweep of a pair.
    %           sweep_group_nbr : Group number, starting at ZERO (for debugging).
    %
    % QUESTION: How handle situation if number of sweeps is not an even multiple of natural "groups"? How handle such an ending?
    
    N_sw = length(sw_data.MIDDLE_TIME_OBT);
    
    %--------------------
    % Sort data by time.
    %--------------------
    [junk, i_sort] = sort(sw_data.MIDDLE_TIME_OBT);
    sw_data = select_structs_arrays_INTERNAL(sw_data, i_sort);
    
    
    %---------------------------------------------------------------------------------------------------------------
    % Assigns variables:
    % has_Pi             : [i] = Number of sweeps on probe i (in practice only used for distinction zero, non-zero). Size 1x2.
    % has_Pi_pairs       : [i] = True iff there is (at least one) sweep pair on probe i.
    % sw_data.pair_first : [i] = Non-zero iff sweep i is the first in a sweep pair.
    %                      New field which is added to sw_data.
    %---------------------------------------------------------------------------------------------------------------
    has_Pi             = zeros(1, 2);
    has_Pi_pairs       = false(1, 2);
    sw_data.pair_first = zeros(N_sw, 1);
    for i_P = 1:2
        i_Pi        = find(sw_data.probe_nbr == i_P);
        has_Pi(i_P) = length(i_Pi);
        
        if has_Pi(i_P)
            % j_swp1 : Positions (within i_Pi) of sweeps which are first in pairs.
            % NOTE: Exact floating-point equality between stop and start times.
            j_swp1 = find(   sw_data.STOP_TIME_OBT(i_Pi(1:end-1)) == sw_data.START_TIME_OBT(i_Pi(2:end))   );
            sw_data.pair_first(i_Pi(j_swp1)) = 1;
            has_Pi_pairs(i_P) = ~isempty(j_swp1);
        end
    end
    
    
    %--------------------------------------------------------------------------
    % Sort sweeps in groups.
    % Current algorithm will (intentionally) omit some sweeps for sufficiently
    % strange macros, but such macros probably do not exist. Should be robust.
    %--------------------------------------------------------------------------
    i_sw  = 1;
    i_grp = 0;
    sim_sweep_data_grps_list = {};
    while true    % Iterate over groups of sweeps.
        
        Pi_complete = ~has_Pi;   % Probes without any sweeps count as complete from the start.
        i_Pi_prev   = [0, 0];    % Previous sweep for given probe (0 = none).
        i_sw_group  = [];
        while ~all(Pi_complete) && (i_sw <= N_sw)     % Iterate over sweeps until one has collected a group of sweeps.
            
            for i_P = 1:2              % For every probe...
                
                if   ~Pi_complete(i_P)   &&   (sw_data.probe_nbr(i_sw) == i_P)
                    
                    if has_Pi_pairs(i_P)
                        if   (i_Pi_prev(i_P) ~= 0)   &&   sw_data.pair_first( i_Pi_prev(i_P) )
                            % CASE: This sweep and the preceding sweep for the same probe are a pair.
                            i_sw_group(end+1) = i_Pi_prev(i_P);
                            i_sw_group(end+1) = i_sw;
                            Pi_complete(i_P)  = true;
                            i_Pi_prev(i_P)    = 0;
                        else
                            i_Pi_prev(i_P) = i_sw;
                        end
                    else
                        % CASE: Probe without pairs. (The probe has sweeps, since sweep i_sw belongs to it.)
                        i_sw_group(end+1) = i_sw;
                        Pi_complete(i_P)  = true;
                    end
                    
                end
            end   % for
            
            i_sw = i_sw + 1;
            
        end   % while
        
        
        %-------------------------------------------------------------------------------------
        % Stop when no further complete group could be collected:
        % - Incomplete group: The sweeps ran out before every probe had contributed.
        % - Empty group     : No sweep was consumed (e.g. no sweeps at all); continuing
        %                     could never make progress.
        % NOTE: The test is on the completeness of the group, NOT on (i_sw > N_sw).
        % A group that is completed by the very last sweep must still be returned.
        %-------------------------------------------------------------------------------------
        if ~all(Pi_complete) || isempty(i_sw_group)
            break
        end
        
        sim_sweep_data = select_structs_arrays_INTERNAL(sw_data, i_sw_group');
        sim_sweep_data.sweep_group_nbr = ones(length(i_sw_group), 1) * i_grp;  % For debugging. Save which group every sweep belongs to.
        sim_sweep_data_grps_list{end+1} = sim_sweep_data;
        i_grp = i_grp + 1;
        
    end   % while
    
end


% #############################################################################################


%==================================================================================
% IMPLEMENTATION OF FUNCTION: Version 2.0
%
% Given a set of sweeps "sim_sweep_data" which are to be regarded as "approximately simultaneous",
% return a set of best estimates based upon them.
% Exact assumptions for the set of sweeps in the argument depends on "group_simultaneous_sweeps_INTERNAL".
%
%
% ARGUMENTS
% =========
% sim_sweep_data : "Simultaneous sweeps data". 1x1 struct where fields are same-sized 1D arrays.
%                   Struct containing the same set of values and parameters for each
%                   sweep in a group of "approximately simultaneous" sweeps.
%
%
% IMPLEMENTATION NOTE
% ===================
% In principle, this function does a lot of work that is redone for every sweep group that
% could probably be done for every operations block.
% However, the "architecture" is chosen (1) to produce clear and unambiguous (and safe) code
% for lots of cases (number of available probes, number of available sweeps, and order of
% up/down sweeps), and (2) to be easily modified (safely).
%
%
% CURRENT IMPLEMENTATION: Assumes 0-2 sweeps from each probe.
% NOTE: If there are two sweeps on same probe, then they are assumed to be a "pair" (immediately adjacent in time).
% NOTE: It is possible to assign a variable at index [] without error. Nothing happens but MATLAB permits it.
%
% QUESTION: How gain access to V_bias_min/max?
%   NOTE: One pair of values per probe (and entire ops block, not sweep).
%==================================================================================
function data_est = select_best_estimates_INTERNAL(sim_sweep_data, V_bias_limits)
    % Derive best estimates for one group of approximately simultaneous sweeps.
    %
    % ARGUMENTS
    % =========
    % sim_sweep_data : 1x1 struct where fields are same-sized 1D arrays (one element per sweep).
    %                  Fields used: probe_nbr, V_LF_HF_before_sweep (compared numerically),
    %                  direction, Illumination, asm_ne_5eV, asm_Te_exp, Vph_knee (passed through str2double),
    %                  START_TIME_UTC (only its size is used).
    % V_bias_limits  : Cell array indexed by probe number; every used component is a struct
    %                  with the fields V_bias_min and V_bias_max.
    %
    % RETURN VALUE
    % ============
    % data_est : Copy of sim_sweep_data in which the str2double-converted fields are numeric,
    %            with the added fields npl_est, Te_est, Vsc_est (NaN where no estimate was selected).
    %
    % NOTE: For every estimated quantity, at most one sweep receives a value: the first sweep
    % in that quantity's priority list. If the value of that sweep is rejected (NaN or
    % out of range), then no lower-priority sweep is tried.
    
    % Fraction of the sweep bias range which is excluded at both ends when accepting Vsc.
    Vsc_BIAS_EXCLUSION_MARGIN_FRACTION = 0.01;
    
    %--------------------------------------------------------
    % Work directly on the return value.
    % Convert selected string fields to numeric values.
    %--------------------------------------------------------
    data_est = sim_sweep_data;
    data_est.direction    = str2double(data_est.direction);
    data_est.Illumination = str2double(data_est.Illumination);
    data_est.asm_ne_5eV   = str2double(data_est.asm_ne_5eV);
    data_est.asm_Te_exp   = str2double(data_est.asm_Te_exp);
    data_est.Vph_knee     = str2double(data_est.Vph_knee);
    
    %--------------------------------------------------------------------------------
    % Elementary per-sweep conditions (logical arrays).
    % NOTE: Illumination values other than exactly 0 and 1 are neither shaded nor lit.
    %--------------------------------------------------------------------------------
    on_P1       = (data_est.probe_nbr == 1);
    on_P2       = (data_est.probe_nbr == 2);
    going_up    = (data_est.direction == 1);
    going_dn    = (data_est.direction == 0);
    lit         = (data_est.Illumination == 1);
    shaded      = (data_est.Illumination == 0);
    bias_pos    = (data_est.V_LF_HF_before_sweep >  0);
    bias_nonpos = (data_est.V_LF_HF_before_sweep <= 0);
    
    %-----------------------------------------------------------------------------------------
    % Is there an up-down pair on probe 2, i.e. exactly two probe 2 sweeps of which the
    % first is an up sweep and the second a down sweep?
    % ASSUMES: Sweeps are sorted in ascending time order, so that index increases with time.
    %-----------------------------------------------------------------------------------------
    idx_P2 = sort(find(on_P2));
    P2_is_updn_pair = false;
    if length(idx_P2) == 2
        P2_is_updn_pair = (data_est.direction(idx_P2(1)) == 1) && (data_est.direction(idx_P2(2)) == 0);
    end
    
    %-------------------------------------------------------------------
    % Index arrays (possibly empty) of sweeps satisfying combinations
    % of the conditions above.
    %-------------------------------------------------------------------
    idx_P1_up         = find(on_P1 & going_up);
    idx_P1_dn         = find(on_P1 & going_dn);
    
    idx_P1_up_lit     = find(on_P1 & going_up & lit);
    idx_P1_dn_lit     = find(on_P1 & going_dn & lit);
    idx_P2_up_lit     = find(on_P2 & going_up & lit);
    idx_P2_dn_lit     = find(on_P2 & going_dn & lit);
    idx_P2_up_lit_nb  = find(on_P2 & going_up & lit & bias_nonpos);
    idx_P2_dn_lit_pb  = find(on_P2 & going_dn & lit & bias_pos);
    
    idx_P2_up_shaded  = find(on_P2 & going_up & shaded);
    idx_P2_dn_pb_pair        = find(on_P2 & going_dn &          bias_pos & P2_is_updn_pair);
    idx_P2_dn_pb_pair_shaded = find(on_P2 & going_dn & shaded & bias_pos & P2_is_updn_pair);
    
    %---------------------------------------------------------------
    % Create the output fields, filled with NaN ("no estimate").
    %---------------------------------------------------------------
    est_size = size(data_est.START_TIME_UTC);
    data_est.npl_est = NaN(est_size);
    data_est.Te_est  = NaN(est_size);
    data_est.Vsc_est = NaN(est_size);
    
    %-------------------------------------------------------------------------------
    % Priority lists, highest priority first.
    % IMPLEMENTATION NOTE: The index arrays are concatenated VERTICALLY.
    %-------------------------------------------------------------------------------
    npl_candidates = [idx_P2_dn_pb_pair;        idx_P2_up_shaded; idx_P1_up; idx_P1_dn];
    Te_candidates  = [idx_P2_dn_pb_pair_shaded; idx_P2_up_shaded; idx_P1_up; idx_P1_dn];
    Vsc_candidates = [idx_P1_up_lit; idx_P1_dn_lit; idx_P2_up_lit_nb; idx_P2_dn_lit_pb; idx_P2_up_lit; idx_P2_dn_lit];
    
    %-------------------------------------------
    % Plasma density: Accept if positive.
    %-------------------------------------------
    for k = npl_candidates'   % Must be row vector.
        n_cand = data_est.asm_ne_5eV(k);
        if isempty(n_cand)
            continue
        end
        if ~isnan(n_cand) && (n_cand > 0)
            data_est.npl_est(k) = n_cand;
        end
        break    % Never continue to a lower-priority sweep.
    end
    
    %-------------------------------------------------
    % Electron temperature: Accept if positive.
    %-------------------------------------------------
    for k = Te_candidates'   % Must be row vector.
        T_cand = data_est.asm_Te_exp(k);
        if isempty(T_cand)
            continue
        end
        if ~isnan(T_cand) && (T_cand > 0)
            data_est.Te_est(k) = T_cand;
        end
        break    % Never continue to a lower-priority sweep.
    end
    
    %------------------------------------------------------------------------------------
    % Spacecraft potential: Accept if within the sweep bias range of the sweep's probe,
    % reduced by a margin at both ends.
    %------------------------------------------------------------------------------------
    for k = Vsc_candidates'   % Must be row vector.
        V_cand = data_est.Vph_knee(k);
        if isempty(V_cand)
            continue
        end
        
        probe_limits = V_bias_limits{data_est.probe_nbr(k)};
        V_lo      = probe_limits.V_bias_min;
        V_hi      = probe_limits.V_bias_max;
        V_exclude = (V_hi - V_lo) * Vsc_BIAS_EXCLUSION_MARGIN_FRACTION;
        V_lo = V_lo + V_exclude;
        V_hi = V_hi - V_exclude;
        
        if   ~isnan(V_cand)   &&   (V_lo <= V_cand)   &&   (V_cand <= V_hi)
            data_est.Vsc_est(k) = V_cand;
        end
        break    % Never continue to a lower-priority sweep.
    end
end


% #############################################################################################


% Writes EST TAB file.
%
% ARGUMENTS
% =========
% MISSING_CONSTANT : PDS' MISSING_CONSTANT.
%
% NOTE: Can/should handle empty values in the form of [].
%       str2double([]) = NaN,
%       str2num([]) ==> Syntax error
%       length(sprintf('%14.7e', NaN)) = 14
%       length(sprintf('%14s',   [] )) = 14
function [row_bytes, N_columns, N_rows] = write_EST_file_INTERNAL(EST_file_path, data, MISSING_CONSTANT)
    % Write an EST TAB file: one comma-separated, CR+LF-terminated row per sweep,
    % sorted by START_TIME_UTC.
    %
    % ARGUMENTS
    % =========
    % EST_file_path    : Path to the file to create (an existing file is overwritten).
    % data             : 1x1 struct where fields are same-sized 1D arrays (one element per sweep). Fields used:
    %                    START_TIME_UTC, STOP_TIME_UTC, Qualityfactor (cell arrays of strings),
    %                    START_TIME_OBT, STOP_TIME_OBT, npl_est, Te_est, Vsc_est,
    %                    probe_nbr, direction, Illumination, sweep_group_nbr (numeric arrays).
    % MISSING_CONSTANT : Value written instead of NaN for npl_est, Te_est, Vsc_est.
    %
    % RETURN VALUES
    % =============
    % row_bytes : Number of bytes in the last written row, including CR+LF. Zero if no rows were written.
    % N_columns : Number of columns per row.
    % N_rows    : Number of rows written.
    %
    % NOTE: Raises an error if the file can not be opened. The file is closed also if writing fails.
    
    %--------------------
    % Sort data by time.
    %--------------------
    [junk, i_sort] = sort(data.START_TIME_UTC);
    O_data = select_structs_arrays_INTERNAL(data, i_sort);
    N_rows = length(data.START_TIME_UTC);
    
    % Replace NaN by MISSING_CONSTANT in the estimates.
    O_data.npl_est(isnan(O_data.npl_est)) = MISSING_CONSTANT;
    O_data.Te_est( isnan(O_data.Te_est))  = MISSING_CONSTANT;
    O_data.Vsc_est(isnan(O_data.Vsc_est)) = MISSING_CONSTANT;
    
    % Assign the return values before the loop so that they are defined also for zero rows.
    N_columns = 2+3+3 + 1+1+1+1;    % Must be consistent with the columns written below.
    row_bytes = 0;
    
    
    %----------------
    % Write to file.
    %----------------
    fid = fopen(EST_file_path, 'w');
    if fid < 0
        error('best_estimates:write_EST_file_INTERNAL', 'Can not open file for writing: %s', EST_file_path)
    end
    try
        for i = 1:N_rows
            % NOTE: ALL columns must be taken from the SORTED data (O_data) so that
            % the columns of a row refer to the same sweep.
            % NOTE: Some variables are strings, others are numeric.
            line = [ ...
                sprintf('%s, %s, ',                 O_data.START_TIME_UTC{i}, O_data.STOP_TIME_UTC{i}), ...
                sprintf('%16.6f, %16.6f, %s, ',     O_data.START_TIME_OBT(i), O_data.STOP_TIME_OBT(i), O_data.Qualityfactor{i}), ...
                sprintf('%14.7e, %14.7e, %14.7e, ', O_data.npl_est(i), O_data.Te_est(i), O_data.Vsc_est(i)), ...
                sprintf('%1i, ',    O_data.probe_nbr(i)), ...             % DEBUG?
                sprintf('%1i, ',    O_data.direction(i)), ...             % DEBUG?
                sprintf('%04.2f, ', O_data.Illumination(i)), ...          % DEBUG?
                sprintf('%5i',      O_data.sweep_group_nbr(i)) ...        % DEBUG? NOTE: The only string without ending comma!
                ];
            
            % Write the row as DATA, not as a format string, so that any '%' or '\'
            % in the string-valued columns is written literally.
            row_bytes = fprintf(fid, '%s\r\n', line);
        end
    catch err
        fclose(fid);    % Do not leak the file handle.
        rethrow(err)
    end
    fclose(fid);
    
end


% #############################################################################################


%=============================================================================
% Reads AxS file
% --------------
% IMPORTANT NOTE: Uses the non-PDS compliant first row
% of column headers in AxS to label variables (names of struct fields).
% When that becomes PDS compliant, this code WILL NOT WORK!
% ---------------------------------------------------------
% NOTE: Returns only strings, except for added fields.
% No conversion strings-to-numbers since that
% would involve interpreting the meaning of values.
% -------------------------------------------------------
% Quite general function for files with first row as column headers. Could in
% principle be repurposed as a general function for general use.
%=============================================================================
function [data, N_rows] = read_AxS_file_INTERNAL(file_path, probe_nbr)
    % Read an AxS file whose first line contains the column headers and return
    % the columns as fields of a struct.
    %
    % ARGUMENTS
    % ---------
    % file_path : Path to the AxS file.
    % probe_nbr : Value copied into every row of the added field "probe_nbr".
    %
    % RETURN VALUES
    % -------------
    % data   : Struct with one field per file column. Field names are derived
    %          from the column headers (see character substitutions below).
    %          Every column is returned as a cell array of trimmed strings,
    %          except START_TIME_OBT and STOP_TIME_OBT which are converted with
    %          str2double. Added fields: MIDDLE_TIME_OBT, probe_nbr.
    % N_rows : Number of DATA rows (i.e. excluding the header line).
    %
    % ERRORS
    % ------
    % Raises error if the file yields no lines, if any line has a different
    % number of comma-separated columns than the header line, or if two column
    % headers map to the same struct field name.
    %
    % PROPOSAL: Assume all (unspecified) fields are numerical and convert to numeric.
    % PROPOSAL: Remove return value N_rows?
    %
    % PROPOSAL: Rename _et to _arbitrary since probably no particular offset/origin and misleading.
    
    line_list = importdata(file_path, '\n');               % Read file into cell array, one line per cell.
    line_value_list = regexp(line_list, ',', 'Split');     % Split strings using delimiter.
    
    if isempty(line_value_list)
        error('Error in AxS file %s: Found no lines. Can therefore not interpret columns.', file_path)
    end
    
    % Check ALL lines (not only the first data line) against the header line so that
    % a malformed file produces an error that identifies the file and the line.
    N_cols_per_line = cellfun(@numel, line_value_list);
    N_cols          = N_cols_per_line(1);
    i_bad_line      = find(N_cols_per_line ~= N_cols, 1);
    if ~isempty(i_bad_line)
        error('Error in AxS file %s: The number of column names on the first line (%i) is NOT equal to the number of data columns on line %i (%i). Can therefore not interpret columns.', ...
            file_path, N_cols, i_bad_line, N_cols_per_line(i_bad_line))
    end
    
    % Every cell in line_value_list is a 1 x N_cols cell array.
    % ==> Vertical concatenation directly yields a 2D (lines x columns) table of strings.
    file_contents = vertcat(line_value_list{:});
    
    N_rows = length(line_value_list) - 1;        % Number of rows of DATA (excluding first line of column headers).
    file_column_name_list = file_contents(1,:);
    file_data             = file_contents(2:end, :);
    
    data = struct();
    for i = 1:N_cols     % For every column ...
        
        col_name = file_column_name_list{i};
        % skey = struct key/field name
        skey = strrep(col_name, '(', '_');
        skey = strrep(skey,     ')', '' );     % NOTE: Remove right bracket (as opposed to left bracket which is replaced).
        skey = strrep(skey,     '=', '' );
        skey = strrep(skey,     '.', '_');
        skey = strrep(skey,     ' ', '' );
        
        % NOTE: Using delimiter ',' to find columns implies one has to
        % trim away leading and trailing white space from columns that could be
        % interpreted as strings. If the real delimiter for writing TAB files
        % is ', ' (comma+whitespace) then the extra whitespace will
        % otherwise end up in the string when reading.
        
        if isfield(data, skey)
            % Report the offending column in the message itself (statements after error() never execute).
            error('Trying to add the same structure field name a second time: field "%s" (column %i, header "%s") in AxS file %s.', ...
                skey, i, col_name, file_path);
        end
        data.(skey) = strtrim(file_data(1:end, i));     % NOTE: Trimming and copying strings. No conversion strings-to-numbers.
    end
    
    %---------------------------------------------------------------------------------------
    % Add extra fields that may be needed by algorithms that choose information from
    % the different probes at only approximately the same time.
    %---------------------------------------------------------------------------------------
    %for i_row = 1:N_rows
    %    START_TIME_et(i_row, 1) = cspice_str2et(data.START_TIME_UTC(i_row));
    %    STOP_TIME_et(i_row, 1)  = cspice_str2et(data.STOP_TIME_UTC(i_row));
    %end
    %data.START_TIME_et = START_TIME_et;    % NOTE: Adds additional field.
    %data.STOP_TIME_et  = STOP_TIME_et;     % NOTE: Adds additional field.
    %data.MIDDLE_TIME_et = (START_TIME_et + STOP_TIME_et) * 0.5;    % NOTE: Adds additional field.
    data.START_TIME_OBT = str2double(data.START_TIME_OBT);
    data.STOP_TIME_OBT  = str2double(data.STOP_TIME_OBT);
    data.MIDDLE_TIME_OBT = (data.START_TIME_OBT + data.STOP_TIME_OBT) * 0.5;    % NOTE: Adds additional field.
    data.probe_nbr = zeros(N_rows, 1) + probe_nbr;
end


% #############################################################################################


% Read IxL/IxH file
% -----------------
% WARNING: Relies on hardcoded column numbers.
% IxL and IxH files have the same format.
%
% =============================================================================================
% NOTE: An out-of-memory error has been observed here once on squid with output as below.
% The code was executed some weeks before 2015-06-11 for archive 1504 (May 2015).
% The line numbers could not be used since the code version had changed.
% THIS IMPLIES THAT THIS FUNCTION SHOULD BE OPTIMIZED WITH REGARDS TO MEMORY USE.
% Therefore tries to catch error locally when information is still available (e.g. file_path).
% -------------------------------------------------------------------------------------
% ....
%  Macroblock 40 out of  40.
%  Latest file created from 2015-04-30T23:56:45.123
%  Analysing sweeps
% 1 bad smoothening performance
% Downsample Low frequency measurements
% Generating Spectra
% Best estimates
%
% lapdog:best_estimates error message: Out of memory. Type HELP MEMORY for your options.
% best_estimates/read_IxLH_file_bias_voltage_INTERNAL, 839,
% best_estimates/main_INTERNAL, 142,
% best_estimates, 65,
% analysis, 92,
% lapdog, 113,
% analysis (incl. best_estimates): 32178 s (elapsed wall time)
% lapdog: generate LBL files....
% createLBL: 180 s (elapsed wall time)
% lapdog: DONE!
% moving derived archive to /data/LAP_ARCHIVE/
% moving edited& calibrated archives to /data/LAP_ARCHIVE
% removing archives from workfolder
% DONE!
% =============================================================================================
% Command-line experiment on memory use when reading file
% (all columns, double precision; middle column is unnecessarily string).
% ----------------------------------------------------------------------
% % -rw-r--r-- 1 ros1a rosetta 436M 2015-06-06 18.40:42 D09/RPCLAP_20150409_000150_807_I1H.TAB
%
% >> fid = fopen('/data/LAP_ARCHIVE/RO-C-RPCLAP-5-1504-DERIV-V0.3/2015/APR/D09/RPCLAP_20150409_000150_807_I1H.TAB', 'r');
% >> file_contents = textscan(fid, '%s%f%s%f%s', 'delimiter', ',');
% >> fc_1 = file_contents{1,1};
% >> fc_2 = file_contents{1,2};
% >> fc_3 = file_contents{1,3};
% >> fc_4 = file_contents{1,4};
% >> fc_5 = file_contents{1,5};
% >> whos file_contents fc_1 fc_2 fc_3 fc_4 fc_5
%   Name                     Size                 Bytes  Class     Attributes
%
%   fc_1               5499840x1              615982080  cell
%   fc_2               5499840x1               43998720  double
%   fc_3               5499840x1              475064408  cell
%   fc_4               5499840x1               43998720  double
%   fc_5               5499840x1              362989440  cell
%   file_contents            1x5             1542033668  cell                    // 1.5 GB!!!!
function data = read_IxLH_file_bias_voltage_INTERNAL(file_path, probe_nbr, memory_use_log_enabled)
    % Read the two numeric columns (file columns 2 and 4) of an IxL/IxH file.
    %
    % ARGUMENTS
    % ---------
    % file_path              : Path to the IxL/IxH file.
    % probe_nbr              : Value copied into every row of the added field "probe_nbr".
    % memory_use_log_enabled : If true, print "whos file_contents" at the end (both on success and on error).
    %
    % RETURN VALUE
    % ------------
    % data : Struct with fields
    %           TIME_OBT  : File column 2, read as single precision.
    %           V_bias    : File column 4, read as single precision.
    %           probe_nbr : Column vector, same number of rows, filled with probe_nbr.
    %
    % ERRORS
    % ------
    % Any error (incl. failure to open the file) is caught locally, its message and call stack
    % are printed to stdout, and a new error naming the file is raised.
    % The file is always closed before leaving the function, also on error.
    
    fid = -1;    % Sentinel: a value >= 0 means "file is open and must be closed".
    try
        fid = fopen(file_path, 'r');
        if fid < 0
            error('Can not read file: %s', file_path)
        end
        %fprintf(1, 'Reading file: %s\n', file_path)       % DEBUG / Log message
        
        % IMPLEMENTATION NOTE: Letting textscan parse numbers is much faster (about ~7 times)
        % than doing so manually with str2double after having read file into strings.
        % IxL files can be so large that speed matters.
        %
        % IMPLEMENTATION NOTE: Only reads the necessary columns and only at single precision to
        % reduce memory use. The lower precision (and hence lower memory use) does seem to
        % follow the values into other variables.
        % %f32 - read a number and convert to single
        % * - Ignore field, do not read
        file_contents = textscan(fid, '%*s%f32%*s%f32%*s', 'delimiter', ',');
        
        fclose(fid);
        fid = -1;    % Mark as closed so that the catch clause does not close it a second time.
        
        N_rows = length(file_contents{1});
        
        %data.UTC_TIME = file_contents{1};    % For debugging. Can disable to reduce memory use.
        data.TIME_OBT = file_contents{1};    % HARDCODED COLUMN NUMBER
        data.V_bias   = file_contents{2};    % HARDCODED COLUMN NUMBER
        
        % Add extra fields that may be needed by algorithms.
        data.probe_nbr = zeros(N_rows, 1) + probe_nbr;
        %           t = tic;
        %           for i_row = 1:N_rows
        %               data.TIME_et(i_row, 1) = cspice_str2et(data.TIME_UTC{i_row});    % Very slow for large files.
        %           end
        %           toc(t)
        
        if memory_use_log_enabled
            fprintf(1, 'read_IxLH_file_bias_voltage_INTERNAL: End of function (try clause) - calling "whos file_contents"\n')
            whos file_contents   % DEBUG
        end
    catch err
        % Try catch error locally to try to give information on out-of-memory errors.
        
        % Do not leak the file handle if the error occurred while the file was open (e.g. in textscan).
        if fid >= 0
            fclose(fid);
        end
        
        fprintf(1,'\nlapdog: best_estimates error message: %s\n',err.message);
        
        % Print call stack (zero iterations if the stack is empty).
        for i = 1:length(err.stack)
            fprintf(1,'%s, %i,\n', err.stack(i).name, err.stack(i).line);
        end
        
        if memory_use_log_enabled
            fprintf(1, 'read_IxLH_file_bias_voltage_INTERNAL: End of function (catch clause) - calling "whos file_contents"\n')
            whos file_contents   % DEBUG
        end
        error('Error occurred when reading IxL/IxH file "%s".\n', file_path)
    end
end

% #############################################################################################

% Read BxS file
% -------------
% WARNING: Relies on hardcoded column numbers.
function [V_bias_min, V_bias_max] = read_BxS_min_max_bias_voltage_INTERNAL(file_path, probe_nbr)
    % Return the smallest and largest value in the second column of a BxS file.
    %
    % ARGUMENTS
    % ---------
    % file_path : Path to the BxS file. Read as two comma-separated numeric columns.
    % probe_nbr : Not used by this function. Kept so that the interface is unchanged.
    %
    % RETURN VALUES
    % -------------
    % V_bias_min, V_bias_max : min and max of file column 2 (empty if the file contains no data).
    %
    % ERRORS
    % ------
    % Raises error if the file can not be opened. (Continuing with an invalid file identifier
    % would only make textscan fail with an error message that does not mention the file.)
    
    fid = fopen(file_path, 'r');
    if fid < 0
        error('Can not read file: %s', file_path)
    end
    %fprintf(1, 'Reading file: %s\n', file_path)       % DEBUG / Log message
    
    try
        file_contents = textscan(fid, '%f%f', 'delimiter', ',');
    catch err
        fclose(fid);     % Do not leak the file handle if reading fails.
        rethrow(err);
    end
    fclose(fid);
    
    V_bias = file_contents{2};    % HARDCODED COLUMN NUMBER
    
    V_bias_min = min(V_bias);
    V_bias_max = max(V_bias);
end

% #############################################################################################

% Generic utility function.
% s_list : 1D cell array, where every component is either a struct or empty.
% Every struct has the same set of fields of the same type.
% All fields within a struct are same-sized column vectors.
%
% NOTE: Treats empty matrices, [], as empty structures.
function s_merged = merge_structs_arrays_INTERNAL(s_list)
    % Concatenate the fields of several structs, field by field, in list order.
    %
    % s_list   : Cell array. Components that are empty are skipped.
    % s_merged : [] if no component is non-empty. Otherwise the first non-empty
    %            component, with the fields of every later non-empty component
    %            appended vertically to the fields of the same name.
    %
    % PROPOSAL: Use vararg instead of cell array.
    % PROPOSAL: Require empty structs (created with "struct" command), not empty matrices.
    
    s_merged = [];
    
    for i_comp = 1:length(s_list)
        part = s_list{i_comp};
        
        % Nothing to add for empty components.
        if isempty(part)
            continue
        end
        
        % The first non-empty component becomes the starting point.
        if isempty(s_merged)
            s_merged = part;
            continue
        end
        
        % Append every field of this component below the already merged rows.
        field_names = fieldnames(part);
        for i_field = 1:numel(field_names)
            name = field_names{i_field};
            s_merged.(name) = vertcat(s_merged.(name), part.(name));
        end
    end
end

% #############################################################################################

% Generic utility function.
% NOTE: Can be used for reordering struct fields.
function s = select_structs_arrays_INTERNAL(s, i)
    % Replace every field of s with its rows i, taken from the first column.
    % The same index i is applied to all fields, so it can be used both for
    % selecting a subset of rows and for reordering rows.
    field_names = fieldnames(s);
    for k = 1:numel(field_names)
        name   = field_names{k};
        column = s.(name);
        s.(name) = column(i, 1);
    end
end