more flat

Chen Xie · Chen Xie · commit a30ff5e35155 · 2016-08-29T11:45:57.000-04:00
diff --git a/devtests.ipynb b/devtests.ipynb
@@ -9,11 +9,26 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {
     "collapsed": false
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[[ 988]\n",
+      " [ 990]\n",
+      " [ 989]\n",
+      " ..., \n",
+      " [ 951]\n",
+      " [ 957]\n",
+      " [1024]]\n",
+      "649886\n"
+     ]
+    }
+   ],
    "source": [
     "import numpy as np\n",
     "from wfdb import rdsamp\n",
@@ -138,11 +153,38 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {
     "collapsed": false
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[[ nan  nan]\n",
+      " [ nan  nan]\n",
+      " [ nan  nan]\n",
+      " ..., \n",
+      " [-21.  nan]\n",
+      " [-21.  nan]\n",
+      " [-20.  nan]]\n",
+      "(10000, 2)\n",
+      "\n",
+      "\n",
+      "\n",
+      "{'nsampseg': [0, 3261, 6750, 125, 1354, 512, 906259, 2604, 1304941, 1280, 512, 2210767, 172500, 5760000, 157500, 3900000, 4425, 18075, 7500, 37500, 22500], 'nsig': 4, 'fmt': [], 'fs': 125.0, 'nseg': 21, 'nsamp': 14518365, 'signame': [], 'units': [], 'skew': [], 'baseline': [], 'sampsperframe': [], 'initvalue': [], 'gain': [], 'comments': [' <age>: 60 <sex>: F'], 'basedate': '10/10/2896', 'filename': ['3975656_layout', '~', '3975656_0001', '3975656_0002', '3975656_0003', '3975656_0004', '3975656_0005', '~', '3975656_0006', '3975656_0007', '3975656_0008', '3975656_0009', '~', '3975656_0010', '~', '3975656_0011', '3975656_0012', '3975656_0013', '3975656_0014', '3975656_0015', '3975656_0016'], 'byteoffset': [], 'basetime': '00:31:25.894'}\n",
+      "\n",
+      "\n",
+      "\n",
+      "{'nsampseg': [], 'nsig': 4, 'fmt': ['0', '0', '0', '0'], 'fs': 125.0, 'nseg': 1, 'nsamp': 0, 'signame': ['II', 'V', 'MCL1', 'ABP'], 'units': ['mV', 'mV', 'mV', 'mmHg'], 'skew': [0, 0, 0, 0], 'baseline': [0, 0, 0, 0], 'sampsperframe': [1, 1, 1, 1], 'initvalue': [-16384, -8192, -1024, -256], 'gain': [83.0, 55.0, 122.0, 1.0], 'comments': [], 'basedate': '', 'filename': ['~', '~', '~', '~'], 'byteoffset': [0, 0, 0, 0], 'basetime': '31:25.894'}\n",
+      "\n",
+      "\n",
+      "\n",
+      "['Empty Segment', {'nsampseg': [], 'nsig': 1, 'fmt': ['80', 'No Channel'], 'fs': 125.0, 'nseg': 1, 'nsamp': 6750, 'signame': ['V', 'No Channel'], 'units': ['mV', 'No Channel'], 'skew': [0, 'No Channel'], 'baseline': [0, 'No Channel'], 'sampsperframe': [1, 'No Channel'], 'initvalue': [0, 'No Channel'], 'gain': [1.0, 'No Channel'], 'comments': [], 'basedate': '', 'filename': ['3975656_0001.dat', 'No Channel'], 'byteoffset': [0, 'No Channel'], 'basetime': '31:51.982'}]\n"
+     ]
+    }
+   ],
    "source": [
     "# Testing rdsamp multi-segment variable layout record - stacksegments\n",
     "import numpy as np\n",
@@ -214,7 +256,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 2,
    "metadata": {
     "collapsed": false
    },
diff --git a/wfdb/_rdsamp.py b/wfdb/_rdsamp.py
@@ -859,61 +859,9 @@ def loadconfig(fn):
             pass
     return config
 
-def rdsamp(
-        recordname,
-        sampfrom=0,
-        sampto=[],
-        channels=[],
-        physical=1,
-        stacksegments=1):
-    """Read a WFDB record and return the signal as a numpy array and the metadata as a dictionary.
-
-    Usage:
-    sig, fields = rdsamp(recordname, sampfrom, sampto, channels, physical, stacksegments)
-
-    Input arguments:
-    - recordname (required): The name of the WFDB record to be read (without any file extensions).
-    - sampfrom (default=0): The starting sample number to read for each channel.
-    - sampto (default=length of entire signal): The final sample number to read for each channel.
-    - channels (default=all channels): Indices specifying the channel to be returned.
-    - physical (default=1): Flag that specifies whether to return signals in physical (1) or digital (0) units.
-    - stacksegments (default=1): Flag used only for multi-segment files. Specifies whether to return the signal as a single stacked/concatenated numpy array (1) or as a list of one numpy array for each segment (0).
-
-
-    Output variables:
-    - sig: An nxm numpy array where n is the signal length and m is the number of channels. 
-      If the input record is a multi-segment record, depending on the input stacksegments flag, 
-      sig will either be a single stacked/concatenated numpy array (1) or a list of one numpy 
-      array for each segment (0). For empty segments, stacked format will contain Nan values, 
-      and non-stacked format will contain a single integer specifying the length of the empty segment.
-    - fields: A dictionary of metadata about the record extracted or deduced from the header/signal file. 
-      If the input record is a multi-segment record, the output argument will be a list of dictionaries:
-              : The first list element will be a dictionary of metadata about the master header.
-              : If the record is in variable layout format, the next list element will be a dictionary 
-                of metadata about the layout specification header.
-              : The last list element will be a list of dictionaries of metadata for each segment. 
-                For empty segments, the dictionary will be replaced by a single string: 'Empty Segment'
-    """
-
-    filestoremove = []
-    config = loadconfig('wfdb.config')
-
-    if config.get('pbdownload','getpbfiles') == 1:  # Flag specifying whether to allow downloading from physiobank
-        recordname, dledfiles = checkrecordfiles(recordname, os.getcwd())
-    
-    if int(config.get('pbdownload','keepdledfiles')) == 0:  # Flag specifying whether to keep downloaded physiobank files
-        filestoremove = dledfiles
-
-    fields = readheader(recordname)  # Get the info from the header file
 
-    if fields["nsig"] == 0:
-        sys.exit("This record has no signals. Use rdann to read annotations")
-    if sampfrom < 0:
-        sys.exit("sampfrom must be non-negative")
-    dirname, baserecordname = os.path.split(recordname)
-
-    if fields["nseg"] == 1:  # single segment file
-        if (len(set(fields["filename"])) ==
+def processsegment(fields, dirname, baserecordname, sampfrom, sampto, channels, physical):
+    if (len(set(fields["filename"])) ==
                 1):  # single dat (or binary) file in the segment
             # Signal length was not specified in the header, calculate it from
             # the file size.
@@ -967,8 +915,8 @@ def rdsamp(
                 sig = np.subtract(sig, np.array(
                     [float(i) for i in fields["baseline"]]))
                 sig = np.divide(sig, np.array([fields["gain"]]))
-
-        else:  # Multiple dat files in the segment. Read different dats and merge them channel wise.
+                
+    else:  # Multiple dat files in the segment. Read different dats and merge them channel wise.
 
             if not channels:  # Default all channels
                 channels = list(range(0, fields["nsig"]))
@@ -1055,15 +1003,12 @@ def rdsamp(
                         fields["fmt"][ch]], ch] = np.nan
                 sig = np.subtract(sig, np.array(
                     [float(b) for b in fields["baseline"]]))
-                sig = np.divide(sig, np.array([fields["gain"]]))
+                sig = np.divide(sig, np.array([fields["gain"]]))    
+                
+    return sig, fields
 
-    # Multi-segment file. Preprocess and recursively call rdsamp on single
-    # segments.
-    else:
-
-        # Determine if this record is fixed or variable layout. startseg is the
-        # first signal segment.
-        if fields["nsampseg"][
+def fixedorvariable(fields):  # Return (startseg, layoutfields) for a multi-segment record's header dict
+    if fields["nsampseg"][
                 0] == 0:  # variable layout - first segment is layout specification file
             startseg = 1
             # Store the layout header info.
@@ -1073,6 +1018,75 @@ def rdsamp(
                     fields["filename"][0]))
         else:  # fixed layout - no layout specification file.
             startseg = 0
+            layoutfields=[]
+    return startseg, layoutfields
+
+def rdsamp(
+        recordname,
+        sampfrom=0,
+        sampto=[],
+        channels=[],
+        physical=1,
+        stacksegments=1):
+    """Read a WFDB record and return the signal as a numpy array and the metadata as a dictionary.
+
+    Usage:
+    sig, fields = rdsamp(recordname, sampfrom, sampto, channels, physical, stacksegments)
+
+    Input arguments:
+    - recordname (required): The name of the WFDB record to be read (without any file extensions).
+    - sampfrom (default=0): The starting sample number to read for each channel.
+    - sampto (default=length of entire signal): The final sample number to read for each channel.
+    - channels (default=all channels): Indices specifying the channel to be returned.
+    - physical (default=1): Flag that specifies whether to return signals in physical (1) or digital (0) units.
+    - stacksegments (default=1): Flag used only for multi-segment files. Specifies whether to return the signal as a single stacked/concatenated numpy array (1) or as a list of one numpy array for each segment (0).
+
+
+    Output variables:
+    - sig: An nxm numpy array where n is the signal length and m is the number of channels. 
+      If the input record is a multi-segment record, depending on the input stacksegments flag, 
+      sig will either be a single stacked/concatenated numpy array (1) or a list of one numpy 
+      array for each segment (0). For empty segments, stacked format will contain Nan values, 
+      and non-stacked format will contain a single integer specifying the length of the empty segment.
+    - fields: A dictionary of metadata about the record extracted or deduced from the header/signal file. 
+      If the input record is a multi-segment record, the output argument will be a list of dictionaries:
+              : The first list element will be a dictionary of metadata about the master header.
+              : If the record is in variable layout format, the next list element will be a dictionary 
+                of metadata about the layout specification header.
+              : The last list element will be a list of dictionaries of metadata for each segment. 
+                For empty segments, the dictionary will be replaced by a single string: 'Empty Segment'
+    """
+
+    filestoremove = []
+    config = loadconfig('wfdb.config')
+
+    if config.get('pbdownload','getpbfiles') == 1:  # Flag specifying whether to allow downloading from physiobank
+        recordname, dledfiles = checkrecordfiles(recordname, os.getcwd())
+    
+    if int(config.get('pbdownload','keepdledfiles')) == 0:  # Flag specifying whether to keep downloaded physiobank files
+        filestoremove = dledfiles
+
+        
+    fields = readheader(recordname)  # Get the info from the header file
+
+    
+    if fields["nsig"] == 0:
+        sys.exit("This record has no signals. Use rdann to read annotations")
+    if sampfrom < 0:
+        sys.exit("sampfrom must be non-negative")
+    dirname, baserecordname = os.path.split(recordname)
+
+    
+    if fields["nseg"] == 1:  # single segment file
+        sig, fields = processsegment(fields, dirname, baserecordname, sampfrom, sampto, channels, physical)
+
+    # Multi-segment file. Preprocess and recursively call rdsamp on single
+    # segments.
+    else:
+            
+        # Determine if this record is fixed or variable layout. startseg is the
+        # first signal segment.    
+        startseg, layoutfields = fixedorvariable(fields)
 
         # Determine the segments and samples that have to be read based on
         # sampfrom and sampto