Web Import now uses dataprep

2017-02-11 15:51:42 +01:00
parent f287f9af21
commit 8d9a8b0d2b
2 changed files with 176 additions and 245 deletions
--- a/rowers/dataprep.py
+++ b/rowers/dataprep.py
@@ -217,6 +217,116 @@ def timedeltaconv(x):
        
    return dt

+# Processes painsled CSV file to database
+def save_workout_database(f2,r,dosmooth=True,workouttype='rower',
+                          dosummary=True,title='Workout',
+                          notes='',totaldist=0,totaltime=0):
+    message = None
+    powerperc = 100*np.array([r.pw_ut2,
+                              r.pw_ut1,
+                              r.pw_at,
+                              r.pw_tr,r.pw_an])/r.ftp
+
+    # make workout and put in database
+    rr = rrower(hrmax=r.max,hrut2=r.ut2,
+		hrut1=r.ut1,hrat=r.at,
+		hrtr=r.tr,hran=r.an,ftp=r.ftp,
+                powerperc=powerperc,powerzones=r.powerzones)
+    row = rdata(f2,rower=rr)
+    if row == 0:
+	return (0,'Error: CSV data file not found')
+
+    if dosmooth:
+        # auto smoothing
+        pace = row.df[' Stroke500mPace (sec/500m)'].values
+        velo = 500./pace
+                
+        f = row.df['TimeStamp (sec)'].diff().mean()
+        windowsize = 2*(int(10./(f)))+1
+        if not 'originalvelo' in row.df:
+	    row.df['originalvelo'] = velo
+
+        if windowsize > 3 and windowsize<len(velo):
+	    velo2 = savgol_filter(velo,windowsize,3)
+        else:
+	    velo2 = velo
+
+        velo3 = pd.Series(velo2)
+        velo3 = velo3.replace([-np.inf,np.inf],np.nan)
+        velo3 = velo3.fillna(method='ffill')
+                
+        pace2 = 500./abs(velo3)
+        
+        row.df[' Stroke500mPace (sec/500m)'] = pace2
+
+        row.df = row.df.fillna(0)
+
+        row.write_csv(f2,gzip=True)
+        try:
+            os.remove(f2)
+        except:
+            pass
+                
+    # recalculate power data
+    if workouttype == 'rower' or workouttype == 'dynamic' or workouttype == 'slides':
+	try:
+	    row.erg_recalculatepower()
+            row.write_csv(f2,gzip=True)
+	except:
+	    pass
+            
+    averagehr = row.df[' HRCur (bpm)'].mean()
+    maxhr = row.df[' HRCur (bpm)'].max()
+    
+    if totaldist == 0:
+        totaldist = row.df['cum_dist'].max()
+    if totaltime == 0:
+        totaltime = row.df['TimeStamp (sec)'].max()-row.df['TimeStamp (sec)'].min()
+        totaltime = totaltime+row.df.ix[0,' ElapsedTime (sec)']
+
+
+    
+    hours = int(totaltime/3600.)
+    if hours>23:
+        message = 'Warning: The workout duration was longer than 23 hours'
+        hours = 23
+
+    minutes = int((totaltime - 3600.*hours)/60.)
+    seconds = int(totaltime - 3600.*hours - 60.*minutes)
+    tenths = int(10*(totaltime - 3600.*hours - 60.*minutes - seconds))
+    duration = "%s:%s:%s.%s" % (hours,minutes,seconds,tenths)
+
+    if dosummary:
+        summary = row.summary()
+        summary += '\n'
+        summary += row.intervalstats()
+
+    workoutdate = row.rowdatetime.strftime('%Y-%m-%d')
+    workoutstarttime = row.rowdatetime.strftime('%H:%M:%S')
+    workoutstartdatetime = thetimezone.localize(row.rowdatetime).astimezone(utc)
+
+    # check for duplicate start times
+    ws = Workout.objects.filter(starttime=workoutstarttime,
+				    user=r)
+    if (len(ws) != 0):
+	message =  "Warning: This workout probably already exists in the database"
+
+    w = Workout(user=r,name=title,date=workoutdate,
+		workouttype=workouttype,
+		duration=duration,distance=totaldist,
+		weightcategory=r.weightcategory,
+		starttime=workoutstarttime,
+		csvfilename=f2,notes=notes,summary=summary,
+		maxhr=maxhr,averagehr=averagehr,
+		startdatetime=workoutstartdatetime)
+
+    w.save()
+    # put stroke data in database
+    res = dataprep(row.df,id=w.id,bands=True,
+                   barchart=True,otwpower=True,empower=True)
+
+    return (w.id,message)
+
 # Create new workout from file and store it in the database
 # This routine should be used everywhere in views.py and mailprocessing.py
 # Currently there is code duplication
@@ -336,105 +446,14 @@ def new_workout_from_file(r,f2,
        except:
            os.remove(f_to_be_deleted+'.gz')

-    powerperc = 100*np.array([r.pw_ut2,
-                              r.pw_ut1,
-                              r.pw_at,
-                              r.pw_tr,r.pw_an])/r.ftp

-    # make workout and put in database
-    rr = rrower(hrmax=r.max,hrut2=r.ut2,
-		hrut1=r.ut1,hrat=r.at,
-		hrtr=r.tr,hran=r.an,ftp=r.ftp,
-                powerperc=powerperc,powerzones=r.powerzones)
-    row = rdata(f2,rower=rr)
-    if row == 0:
-	return (0,'Error: CSV data file not found')
+    dosummary = (fileformat != 'fit')
+    id,message = save_workout_database(f2,r,
+                                       workouttype=workouttype,
+                                       dosummary=dosummary,
+                                       title=title)

-    # auto smoothing
-    pace = row.df[' Stroke500mPace (sec/500m)'].values
-    velo = 500./pace
-                
-    f = row.df['TimeStamp (sec)'].diff().mean()
-    windowsize = 2*(int(10./(f)))+1
-    if not 'originalvelo' in row.df:
-	row.df['originalvelo'] = velo
-
-    if windowsize > 3 and windowsize<len(velo):
-	velo2 = savgol_filter(velo,windowsize,3)
-    else:
-	velo2 = velo
-
-    velo3 = pd.Series(velo2)
-    velo3 = velo3.replace([-np.inf,np.inf],np.nan)
-    velo3 = velo3.fillna(method='ffill')
-                
-    pace2 = 500./abs(velo3)
-
-    row.df[' Stroke500mPace (sec/500m)'] = pace2
-
-    row.df = row.df.fillna(0)
-
-    row.write_csv(f2,gzip=True)
-    try:
-        os.remove(f2)
-    except:
-        pass
-                
-    # recalculate power data
-    if workouttype == 'rower' or workouttype == 'dynamic' or workouttype == 'slides':
-	try:
-	    row.erg_recalculatepower()
-            row.write_csv(f2,gzip=True)
-	except:
-	    pass
-            
-    if fileformat != 'fit' and summary == '':
-	summary = row.summary()
-	summary += '\n'
-	summary += row.intervalstats_painsled()
-
-    averagehr = row.df[' HRCur (bpm)'].mean()
-    maxhr = row.df[' HRCur (bpm)'].max()
-    
-    totaldist = row.df['cum_dist'].max()
-    totaltime = row.df['TimeStamp (sec)'].max()-row.df['TimeStamp (sec)'].min()
-    totaltime = totaltime+row.df.ix[0,' ElapsedTime (sec)']
-
-    hours = int(totaltime/3600.)
-    if hours>23:
-        message = 'Warning: The workout duration was longer than 23 hours'
-        hours = 23
-
-    minutes = int((totaltime - 3600.*hours)/60.)
-    seconds = int(totaltime - 3600.*hours - 60.*minutes)
-    tenths = int(10*(totaltime - 3600.*hours - 60.*minutes - seconds))
-    duration = "%s:%s:%s.%s" % (hours,minutes,seconds,tenths)
-
-    workoutdate = row.rowdatetime.strftime('%Y-%m-%d')
-    workoutstarttime = row.rowdatetime.strftime('%H:%M:%S')
-    workoutstartdatetime = thetimezone.localize(row.rowdatetime).astimezone(utc)
-
-    # check for duplicate start times
-    ws = Workout.objects.filter(starttime=workoutstarttime,
-				    user=r)
-    if (len(ws) != 0):
-	message =  "Warning: This workout probably already exists in the database"
-
-    w = Workout(user=r,name=title,date=workoutdate,
-		workouttype=workouttype,
-		duration=duration,distance=totaldist,
-		weightcategory=r.weightcategory,
-		starttime=workoutstarttime,
-		csvfilename=f2,notes=notes,summary=summary,
-		maxhr=maxhr,averagehr=averagehr,
-		startdatetime=workoutstartdatetime)
-
-    w.save()
-    # put stroke data in database
-    res = dataprep(row.df,id=w.id,bands=True,
-                   barchart=True,otwpower=True,empower=True)
-
-    return (w.id,message)
+    return (id,message)

 # Compare the data from the CSV file and the database
 # Currently only calculates number of strokes. To be expanded with