Skip to content

Analyze Timing

analyze_timing

analyze_timing

Attributes

logger module-attribute

logger = getLogger(__name__)

Functions

custom_erf

custom_erf(x, a, sigma, mu, b)
Source code in scripts/analyze_timing.py
def custom_erf(x, a, sigma, mu, b):
    """Scaled-and-shifted error function: a * erf((x - mu) / (sqrt(2)*sigma)) + b."""
    z = (x - mu) / (np.sqrt(2) * sigma)
    return a * special.erf(z) + b

fit_irfs1

fit_irfs1(x_data, y_data, run_number=None, t_stage=None)
Source code in scripts/analyze_timing.py
def fit_irfs1(x_data, y_data, run_number=None, t_stage=None):
    """Fit an error-function instrument-response curve to a timing scan.

    The data are cleaned (non-finite pairs dropped), sorted by x, lightly
    smoothed to derive robust initial guesses, normalized to the smoothed
    5th/95th percentiles, and fit with a bounded erf model.  A diagnostic
    plot is shown and the fitted parameters are printed.

    Args:
        x_data: delay-axis values (array-like).
        y_data: signal values (array-like), same length as ``x_data``.
        run_number: optional run number, used only in the plot title.
        t_stage: optional stage/motor name, used only in the plot title.

    Returns:
        tuple: ``(popt, x_data, y_norm, y_fit)`` where ``popt`` is the
        fitted ``[a, sigma, mu, b]``.

    Raises:
        ValueError: if fewer than 8 finite points remain, the data have no
            dynamic range, or all x values are identical.
        RuntimeError: if the least-squares fit fails to converge.
    """
    from scipy.ndimage import gaussian_filter1d  # hoisted: import once, up front

    def custom_erf(x, a, sigma, mu, b):
        # erf step: amplitude a, width sigma, center mu, offset b
        return a * special.erf((x - mu) / (np.sqrt(2) * sigma)) + b

    # --- Convert & clean: drop NaN/inf pairs ---
    x_data = np.asarray(x_data, dtype=float)
    y_data = np.asarray(y_data, dtype=float)

    mask = np.isfinite(x_data) & np.isfinite(y_data)
    x_data = x_data[mask]
    y_data = y_data[mask]

    if x_data.size < 8:
        raise ValueError("Not enough valid data points.")

    # --- Sort so gradients and plots are well defined ---
    order = np.argsort(x_data)
    x_data = x_data[order]
    y_data = y_data[order]

    # --- Light smoothing to suppress noise (optional but helps a lot) ---
    y_smooth = gaussian_filter1d(y_data, sigma=2)

    # --- Normalize robustly (percentiles avoid max spikes) ---
    y_min = np.percentile(y_smooth, 5)
    y_max = np.percentile(y_smooth, 95)

    if y_max - y_min == 0:
        raise ValueError("Data has no dynamic range.")

    y_norm = (y_data - y_min) / (y_max - y_min)

    # --- Automatic edge detection: start mu at the steepest point ---
    dydx = np.gradient(y_smooth, x_data)
    mu_initial = x_data[np.argmax(np.abs(dydx))]

    # --- Initial width: a small fraction of the scan span ---
    x_span = x_data.max() - x_data.min()
    if x_span == 0:
        # Degenerate scan: bounds below would collapse to a point.
        raise ValueError("All x values are identical; cannot fit an edge.")
    sigma_initial = x_span / 20

    # --- Amplitude & offset guesses for data normalized to ~[0, 1] ---
    a_initial = 0.5
    b_initial = 0.5

    p0 = [a_initial, sigma_initial, mu_initial, b_initial]

    # --- Bounds (critical for stability) ---
    bounds = (
        [-2,  x_span/1000, x_data.min(), -1],   # lower
        [ 2,  x_span,      x_data.max(),  2]    # upper
    )

    try:
        popt, pcov = curve_fit(
            custom_erf,
            x_data,
            y_norm,
            p0=p0,
            bounds=bounds,
            maxfev=20000
        )
    except RuntimeError as err:
        # Chain the cause so the optimizer's diagnostic message is not lost.
        raise RuntimeError("Fit failed to converge.") from err

    y_fit = custom_erf(x_data, *popt)

    # --- Diagnostic plot ---
    plt.figure(figsize=(5, 3))
    plt.scatter(x_data, y_norm, s=15, label='Data')
    plt.plot(
        x_data,
        y_fit,
        # FWHM = 2*sqrt(2*ln 2)*sigma ~= 2.355*sigma
        label=f'Fitted IRF, FWHM = {abs(popt[1])*2.355:.4f} fs or units'
    )
    plt.xlabel('Delay')
    plt.ylabel('Normalized Signal')

    title = "Sigmoid Fit"
    if run_number is not None:
        title += f" | Run {run_number}"
    if t_stage is not None:
        title += f" | {t_stage}"

    plt.title(title)
    plt.legend()
    plt.grid()
    plt.tight_layout()
    plt.show()

    print("\nFitted Parameters:")
    print(f"FWHM [fs]  = {abs(popt[1])*2.355:.2f}")
    print(f"Center [ps]= {popt[2]:.4f}")
    print(f"Amplitude  = {popt[0]:.3f}")

    return popt, x_data, y_norm, y_fit

get_scan_motor

get_scan_motor(run)
Source code in scripts/analyze_timing.py
def get_scan_motor(run):
    """Identify the scanned motor for a psana run.

    Scans ``run.scaninfo`` for the first 'raw' entry whose name is not a
    bookkeeping field.

    Args:
        run: psana run object exposing ``scaninfo`` (keys are
            ``(name, kind)`` pairs).

    Returns:
        str: the scanned motor name.

    Raises:
        ValueError: if no scanned motor can be identified (instead of the
            opaque StopIteration a bare ``next()`` would raise).
    """
    tmp = run.scaninfo
    ignore = {'step_value', 'step_docstring'}

    mot_name = next(
        (k[0] for k in tmp if k[1] == 'raw' and k[0] not in ignore),
        None,
    )
    if mot_name is None:
        raise ValueError("No scanned motor found in run.scaninfo")
    logger.info(f'Scanning motor found as: {mot_name}')
    return mot_name

main

main(args)

Main entry point allowing external calls; also the entry point for console_scripts. Args: `args` (list[str]): command-line parameter list.

Source code in scripts/analyze_timing.py
def main(args):
    """
    Main entry point allowing external calls
    Entry point for console_scripts
    Args:
      args ([str]): command line parameter list
    """
    opts = parse_args(args)
    # Dispatch on the requested step; unknown types fall through silently.
    handlers = {"proxy": proxy_jump, "output": output}
    handler = handlers.get(opts.run_type)
    if handler is not None:
        handler(opts.facility, opts.experiment, opts.run)

output

output(facility: str = 'S3DF', exp: str = None, run: str = None)

Generates the output of the timing scan.

Parameters: `facility` (str): default "S3DF"; options: "S3DF", "NERSC". `exp` (str): experiment number; current experiment by default. `run` (str): the run you'd like to process.

Source code in scripts/analyze_timing.py
def output(
        facility: str = "S3DF",
        exp: str = None,
        run: str = None):
    """ Generates the output of the timing scan.

    Reads the QADC diode traces, the DG3 camera and the scanned delay motor
    for one run, builds a per-event DataFrame, removes outliers (IQR), bins
    the (delay, signal) points, and fits an erf IRF via fit_irfs1.

    Parameters:
        facility (str):
            Default: "S3DF". Options: "S3DF", "NERSC"
            NOTE(review): currently unused inside this function.
        exp (str):
            experiment number. Current experiment by default
        run (str):
            The run you'd like to process
    """
    # Sample windows (ADC sample indices) summed for each diode channel.
    qadc0_low = 10
    qadc0_high = 50
    qadc1_low = 74
    qadc1_high = 130

    # diode_0 = run.Detector('qadc_ch0')
    # diode_1 = run.Detector('qadc_ch1')

    # plt.plot(diode_0[qadc0_low:qadc0_high],label='qadc0')
    # plt.plot(diode_1[qadc1_low:qadc1_high],label='qadc1')
    # plt.legend()

    # Load all QADC data from XTC and save in a df
    experiment = exp
    run_numbers = [run]  # single run; the loop below is written for a list

    all_counts=[]  # NOTE(review): unused
    evts=0
    qadc0_cropped = []
    qadc1_cropped = []
    time_mot = []
    x_ray_diode_sum = []
    dg3_sum = []
    x = []  # NOTE(review): unused

    # want to pick up the scanned motor automatically
    # (local twin of the module-level get_scan_motor, but uses print
    # instead of the logger)
    def get_scan_motor(run):
        tmp = run.scaninfo
        ignore = {'step_value', 'step_docstring'}

        mot_name = next(k[0] for k in tmp if k[1] == 'raw' and k[0] not in ignore)
        print(f'Scanning motor found as: {mot_name}')
        return mot_name


    for run_number in run_numbers:
        logger.info(f'Processing run {run_number} for experiment {experiment}...')
        ds = DataSource(exp=experiment, run=int(run_number), xdetectors=['jungfrau'])

        # NOTE(review): this loop variable shadows the `run` parameter.
        for run in ds.runs():
            diode_0 = run.Detector('qadc_ch0')
            diode_1 = run.Detector('qadc_ch1')
            dg3_cam = run.Detector('alvium_dg3')  # camera

            t_stage = get_scan_motor(run)
            tmptmp = run.Detector(t_stage)  # detector for the scanned motor position
            ipm = run.Detector('MfxDg2BmMon')  # X-ray intensity monitor

            evts=0

            for i_evt, evt in enumerate(run.events()):
                evts+=1

                diode_val_0 = diode_0.raw.value(evt)
                diode_val_1 = diode_1.raw.value(evt)

                # Keep only events where both diode traces are present.
                if diode_val_0 is not None and diode_val_1 is not None:

                    # Sum of |samples| over each channel's window.
                    tmp0 = np.sum(np.abs(diode_val_0[qadc0_low:qadc0_high]))
                    tmp1 = np.sum(np.abs(diode_val_1[qadc1_low:qadc1_high]))

                    qadc0_cropped.append(tmp0)
                    qadc1_cropped.append(tmp1)

                    time_mot.append(tmptmp(evt))
                    x_ray_diode_sum.append(ipm.raw.totalIntensityJoules(evt))

                    # --- camera read with try ---
                    # Missing/bad camera frames become NaN rather than aborting.
                    try:
                        img = dg3_cam.raw.value(evt)
                        if img is not None:
                            img_sum = np.sum(img)
                        else:
                            img_sum = np.nan
                    except Exception:
                        img_sum = np.nan

                    dg3_sum.append(img_sum)


        # NOTE(review): these rebind the lists to arrays inside the
        # run_numbers loop; a second run number would fail on .append().
        # Latent today because run_numbers always holds one element.
        qadc0_cropped = np.array(qadc0_cropped)
        qadc1_cropped = np.array(qadc1_cropped)

        data = {
            't_position': time_mot,
            'qadc0_sum': qadc0_cropped,
            'qadc1_sum': qadc1_cropped,
            'x_ray_diode_sum': x_ray_diode_sum,
            'dg3_sum': dg3_sum
        }

        df = pd.DataFrame(data)

        # No normalization applied yet -- these are straight copies.
        df['normalized_laser'] = df['qadc1_sum']
        df['normalized_laser_dg3'] = df['dg3_sum']

        fig, axes = plt.subplots(1, 2, figsize=(10, 4), sharex=True)

        axes[0].scatter(df['t_position'], df['normalized_laser'], s=0.1)
        axes[0].set_title(f'Run: {run_number}, scanning: {t_stage}')
        axes[0].set_xlabel('time (ps?)')
        axes[0].set_ylabel('normalized laser')

        axes[1].scatter(df['t_position'], df['normalized_laser_dg3'], s=0.1)
        axes[1].set_title('DG3')
        axes[1].set_xlabel('time (ps?)')

        plt.tight_layout()
        plt.show()

        # Remove outliers and bin data
        diode_repsonse = 'normalized_laser_dg3' # could use normalized_laser_x_ray if X-ray normalization look sensible
        # --- Remove outliers using IQR on normalized_laser ---
        Q1 = df[diode_repsonse].quantile(0.25)
        Q3 = df[diode_repsonse].quantile(0.75)
        IQR = Q3 - Q1

        # Keep only points within 1.5 * IQR
        df_clean = df[(df[diode_repsonse] >= Q1 - 1.5 * IQR) &
                    (df[diode_repsonse] <= Q3 + 1.5 * IQR)]

        # --- Bin and plot ---
        n_bins = 100
        # NOTE(review): df_clean is a filtered slice of df; assigning a new
        # column here may raise pandas' SettingWithCopyWarning.
        if t_stage == 'lxt_ttc' or t_stage == 'mfx_lxt_fast1' or t_stage == 'mfx_lxt_fast2':
            # These stages appear to report positions in a non-float dtype,
            # hence the cast before binning -- TODO confirm against psana.
            df_clean['t_bin'] = pd.cut(df_clean['t_position'].astype(float), bins=n_bins)
        else:
            df_clean['t_bin'] = pd.cut(df_clean['t_position'], bins=n_bins)

        binned = df_clean.groupby('t_bin').agg({
            't_position': 'mean',
             diode_repsonse: 'mean'
        })

        plt.scatter(binned['t_position'], binned[diode_repsonse], color='royalblue', s=40)
        plt.xlabel('t_position')
        plt.ylabel('normalized_laser')
        plt.title('Binned Scatter (Outliers Removed)')
        plt.grid(True)
        plt.show()

        # Now fit
        fit_irfs1(binned['t_position'], binned[diode_repsonse], run_number, t_stage)

parse_args

parse_args(args)

Parse command line parameters

Args: `args` (list[str]): command-line parameters as a list of strings.

Returns: `argparse.Namespace`: parsed command-line parameters.

Source code in scripts/analyze_timing.py
def parse_args(args):
    """Parse command line parameters

    Args:
      args ([str]): command line parameters as list of strings

    Returns:
      :obj:`argparse.Namespace`: command line parameters namespace
    """
    parser = argparse.ArgumentParser(
        # Fixed: description was copy-pasted from an unrelated cctbx script.
        description="Analyze an MFX timing scan run."
    )
    parser.add_argument(
        "--facility",
        "-f",
        dest="facility",
        default=None,
        help="Enter -f to specify facility",
    )
    parser.add_argument(
        "--type",
        "-t",
        dest="run_type",
        default=None,
        help="Enter -t to specify which step proxy or output",
    )
    parser.add_argument(
        "--experiment",
        "-e",
        dest="experiment",
        default=None,
        help="Enter -e to specify experiment number",
    )
    parser.add_argument(
        "--run",
        "-r",
        dest="run",
        default=None,
        help="Enter -r for the run you'd like to process."
    )
    return parser.parse_args(args)

proxy_jump

proxy_jump(facility: str = 'S3DF', exp: str = None, run: str = None)

Proxies the timing-scan analysis to the selected facility via SSH.

Parameters: `facility` (str): default "S3DF"; options: "S3DF", "NERSC". `exp` (str): experiment number; current experiment by default. `run` (str): the run you'd like to process.

Source code in scripts/analyze_timing.py
def proxy_jump(
        facility: str = "S3DF",
        exp: str = None,
        run: str = None):
    """ Proxies the timing-scan analysis to the selected facility via ssh.

    Builds an ssh command targeting the chosen facility and executes it
    with ``os.system``.

    Parameters:
        facility (str):
            Default: "S3DF". Options: "S3DF", "NERSC"
        exp (str):
            experiment number. Current experiment by default
        run (str):
            The run you'd like to process
    """
    if facility.upper() == "NERSC": #need paths to work on nersc
        # NOTE(review): strips a 3-char prefix and 2-char suffix from the
        # experiment name -- presumably LCLS naming; confirm with callers.
        exp = exp[3:-2]
        proc = [
                f"ssh -i ~/.ssh/cctbx -YAC cctbx@perlmutter-p1.nersc.gov "
                f"/global/common/software/lcls/mfx/scripts/cctbx/energy_calib_output.sh "
                f"{facility} {exp} {run}"
            ]
    elif facility.upper() == "S3DF":
        proc = [
            f"ssh -Yt psana '"
            f"source /sdf/group/lcls/ds/ana/sw/conda2/manage/bin/psconda.sh && "
            f"python /sdf/group/lcls/ds/tools/mfx/scripts/analyze_timing.py "
            f"-f {facility} -t output -e {exp} -r {run}'"
            ]
    else:
        # Use the module logger (not the root logger) for consistency with
        # the rest of this module.
        logger.error(f"Facility not found: {facility}. Program Exit.")
        sys.exit()

    logger.info(proc)
    # NOTE(security): exp/run are interpolated into a shell string; they come
    # from the CLI. Prefer subprocess.run([...], shell=False) if these can
    # ever be untrusted.
    os.system(proc[0])

run

run()

Entry point for console_scripts

Source code in scripts/analyze_timing.py
def run():
    """Entry point for console_scripts."""
    argv = sys.argv[1:]
    main(argv)