fligt
diff --git a/‎notebooks/30_parsing-bytes.ipynb
+58-77 b/‎notebooks/30_parsing-bytes.ipynb
+58-77
@@ -910,7 +910,7 @@
     {
      "data": {
       "text/plain": [
-       "'hi-3i9f7hfhfhfhf8hfhi-S-h-Z'"
+       "'hi-3i9f7hfhfhfhf8hfhi-*Z'"
       ]
      },
      "execution_count": null,
@@ -934,6 +934,13 @@
    "id": "d38a5b21-8a4f-4191-8f39-9e8ec4312191",
    "metadata": {},
    "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[b'\\x0cRoHS 50 Hi-Z\\x01']\n"
+     ]
+    },
     {
      "data": {
       "text/html": [
@@ -1157,18 +1164,13 @@
        "    </tr>\n",
        "    <tr>\n",
        "      <th>39</th>\n",
-       "      <td>RoHS 50 Hi-Z</td>\n",
-       "      <td>TubeSpec?</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>40</th>\n",
-       "      <td>1</td>\n",
+       "      <td>[b'\\x0cRoHS 50 Hi-Z\\x01']</td>\n",
        "      <td>??</td>\n",
        "    </tr>\n",
        "    <tr>\n",
-       "      <th>41</th>\n",
+       "      <th>40</th>\n",
        "      <td>[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 6, ...</td>\n",
-       "      <td>2048 counts</td>\n",
+       "      <td>Intensity_2048_channels</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
@@ -1215,9 +1217,8 @@
        "36                                             1017.0   \n",
        "37                                               2048   \n",
        "38                                                 38   \n",
-       "39                                       RoHS 50 Hi-Z   \n",
-       "40                                                  1   \n",
-       "41  [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 6, ...   \n",
+       "39                          [b'\\x0cRoHS 50 Hi-Z\\x01']   \n",
+       "40  [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 6, ...   \n",
        "\n",
        "                        param_keys  \n",
        "0                       block_type  \n",
@@ -1259,9 +1260,8 @@
        "36         NosePressureInMilliBars  \n",
        "37                NumberOfChannels  \n",
        "38              NoseTemperatureInC  \n",
-       "39                       TubeSpec?  \n",
-       "40                              ??  \n",
-       "41                     2048 counts  "
+       "39                              ??  \n",
+       "40         Intensity_2048_channels  "
       ]
      },
      "metadata": {},
@@ -1394,6 +1394,8 @@
    "source": [
     "#|export \n",
     "\n",
+    "# previous xformat for block type 3 (replaced by 'hi-3i9f7hfhfhfhf8hfhi-*Z' below): 'hi-3i9f7hfhfhfhf8hfhi-S-h-Z'\n",
+    "\n",
     "PDZ_25_STRUCTURE_DICT = {\n",
     "    25:  {'xformat': 'hi-10X-i', \n",
     "          'param_keys': ['pdz_type', 'block_size', 'FileFormatString?', '??']}, \n",
@@ -1404,7 +1406,7 @@
     "          'param_keys': ['block_type', 'block_size', '??', 'RawCounts', 'ValidCounts', '??', '??', \n",
     "                         '??', 'ActiveTimeInSeconds', 'DeadTimeInSeconds', 'ResetTimeInSeconds', \n",
     "                         'LiveTimeInSeconds', 'TotalElapsedTimeInSeconds', '??']}, \n",
-    "    3:   {'xformat': 'hi-3i9f7hfhfhfhf8hfhi-S-h-Z', \n",
+    "    3:   {'xformat': 'hi-3i9f7hfhfhfhf8hfhi-*Z', \n",
     "          'param_keys': ['block_type', 'block_size', '??', 'RawCounts', 'ValidCounts', \n",
     "                         '??', '??', '??', 'ActiveTimeInSeconds', 'DeadTimeInSeconds', \n",
     "                         'ResetTimeInSeconds', 'LiveTimeInSeconds', 'XrayVoltageInkV', 'XrayFilamentCurrentInMicroAmps', \n",
@@ -1413,61 +1415,10 @@
     "                         '??', '??', 'eVPerChannel', '??', 'eVStart', \n",
     "                         'Year', 'Month', 'AM/PM code?', 'Day', 'Hour', 'Minutes', 'Seconds', \n",
     "                         '??', 'NosePressureInMilliBars', 'NumberOfChannels', 'NoseTemperatureInC', \n",
-    "                         'TubeSpec?', '??', '2048 counts']}}\n",
+    "                         '??', 'Intensity_2048_channels']}}\n",
     "\n",
+    "# moved extract_spectra() function to legacy module \n",
     "\n",
-    "def extract_spectra(pdz_file, to_csv=True, verbose=True): \n",
-    "    '''Directly extract spectral data from `pdz_file`. \n",
-    "    \n",
-    "    Robust extraction of spectrum counts and energy calibration. Other meta data is ignored. '''\n",
-    "\n",
-    "    pdz_bytes = file_to_bytes(pdz_file)\n",
-    "    block_list = get_blocks(pdz_bytes, verbose=False) \n",
-    "    \n",
-    "    # select type 3 blocks\n",
-    "    b3_list = [b for b in block_list if b['block_type'] == 3] \n",
-    "    n_spectra = len(b3_list) \n",
-    "\n",
-    "    # parsing spectrum parameters \n",
-    "    #from first block to compute channel energies (keV) \n",
-    "    # (assuming that these are similar for all spectra in the pdz file) \n",
-    "    \n",
-    "    arr = b3_list[0]['bytes'] # only using first spectrum!  \n",
-    "    spectrum_params = multiparse('hi-3i9f7hfhfhfhf8hfhi-S-h', arr, verbose=False)[0]  \n",
-    "    tube_keV = spectrum_params[12] # FYI \n",
-    "    delta_keV = spectrum_params[25] / 1000\n",
-    "    start_keV = spectrum_params[27] / 1000 \n",
-    "    n_channels = spectrum_params[37] \n",
-    "    if n_channels != 2048: \n",
-    "        print(f'Found unexpected number of channels in pdz metadata: {n_channels}')\n",
-    "        \n",
-    "    stop_keV = start_keV + delta_keV * (n_channels -1)\n",
-    "    x_keV = np.linspace(start_keV, stop_keV, num=n_channels) \n",
-    "\n",
-    "    # initialize array \n",
-    "    \n",
-    "    spectra_df = pd.DataFrame(index=x_keV)\n",
-    "\n",
-    "    # TODO: Test if computed channel energies `x_keV` are reasonable, \n",
-    "    # Parsing of spectrum parameters might fail \n",
-    "    # if Bruker messes with file format.   \n",
-    "    # otherwise fall back on 0-40 keV range  \n",
-    "\n",
-    "    spectrum_list = [] \n",
-    "\n",
-    "    for i, b3 in enumerate(b3_list):  \n",
-    "        arr = b3['bytes'] \n",
-    "        counts = np.array(parse(f'{n_channels}i', arr[-4*n_channels:], verbose=False)[0])  \n",
-    "\n",
-    "        spectra_df[f'spectrum #{i+1}'] = counts\n",
-    "\n",
-    "    if to_csv == True: \n",
-    "        csv_file = f'{pdz_file}.csv' \n",
-    "        print(f'Saving spectral data to: {csv_file}')\n",
-    "        spectra_df.to_csv(csv_file, float_format='%10.5f')\n",
-    "\n",
-    "    return spectra_df\n",
-    "           \n",
     "\n",
     "def multiparse(xformat, arr, param_keys=None, verbose=True): \n",
     "    '''Parse segments in extendend format string `xformat` e.g. '<i5f-2S-T-3S-S-f' '''\n",
@@ -1483,11 +1434,35 @@
     "            result, arr = read_table(p, arr, verbose=False) \n",
     "        elif 'X' in p: \n",
     "            result, arr = skip_bytes(p, arr, verbose=False) \n",
-    "        elif 'Z' in p: \n",
+    "            \n",
+    "        # four spectral data scenarios here: \n",
+    "\n",
+    "        # (1) 2048 channels at end of array and skip any bytes before\n",
+    "        elif p == '*Z': \n",
+    "            # split array  \n",
+    "            n_channels = 2048 \n",
+    "            arr_0 = arr[:-n_channels*4] # head \n",
+    "            arr_1 = arr[-n_channels*4:] # tail             \n",
+    "            skipped, _ = skip_bytes('*X', arr_0, verbose=False)\n",
+    "            counts, arr = read_counts('Z', arr_1 , verbose=False) # arr should now be empty \n",
+    "            result = [skipped, counts]             \n",
+    "        # (2) 1024 channels at end of array and skip any bytes before\n",
+    "        elif p == '*z': \n",
+    "            # split array  \n",
+    "            n_channels = 1024 \n",
+    "            arr_0 = arr[:-n_channels*4] # head \n",
+    "            arr_1 = arr[-n_channels*4:] # tail \n",
+    "            \n",
+    "            skipped, _ = skip_bytes('*X', arr_0, verbose=False)\n",
+    "            counts, arr = read_counts('z', arr_1 , verbose=False) # arr should now be empty \n",
+    "            result = [skipped, counts]             \n",
+    "        # (3) 2048 channels not at end of array \n",
+    "        elif p == 'Z': \n",
     "            result, arr = read_counts(p, arr, verbose=False)\n",
     "            result = [result]\n",
-    "        elif 'z' in p: \n",
-    "            result, arr = read_counts(p, arr, n_channels=1028, verbose=False)\n",
+    "        # (4) 1024 channels not at end of array \n",
+    "        elif p == 'z': \n",
+    "            result, arr = read_counts(p, arr, verbose=False)\n",
     "            result = [result]    \n",
     "        \n",
     "        else: \n",
@@ -1620,14 +1595,20 @@
     "    return table, arr\n",
     "\n",
     "\n",
-    "def read_counts(xformat, arr, n_channels=2048, verbose=True): \n",
+    "def read_counts(xformat, arr, verbose=True): \n",
     "    '''Extract counts. '''\n",
     "\n",
-    "    assert xformat == 'Z'  or xformat == 'z', 'Incorrect format string'\n",
-    "\n",
-    "    format = f'<{n_channels}i'\n",
+    "    assert xformat == 'Z'  or xformat == 'z', 'Incorrect spectral data format string. Should be `Z` or `z`' \n",
+    "    \n",
+    "    if xformat == 'Z': \n",
+    "        n_channels = 2048 \n",
+    "    elif xformat == 'z': \n",
+    "        n_channels = 1024 \n",
+    "        \n",
+    "    # make struct compatible format string \n",
+    "    _format = f'<{n_channels}i'\n",
     "\n",
-    "    counts, arr = parse(format, arr, verbose=False) \n",
+    "    counts, arr = parse(_format, arr, verbose=False) \n",
     "    counts = np.array(counts)\n",
     "        \n",
     "    if verbose: \n",