In this example, you are given a number of sample sensor logs and asked to write an algorithm to count the number of steps. The different logs correspond to different sensor placements (left pocket, right pocket, wrist) and to different walking patterns (e.g. with delays between short bursts of steps). The title of each log says how many steps are present; try to get reasonably close to this number.
import pandas as pd
import matplotlib
import matplotlib.pyplot as plt
from scipy.signal import find_peaks
import glob
import re
matplotlib.style.use('ggplot')
%matplotlib inline
The find_peaks function from scipy.signal can be used to detect peaks and valleys in timeseries data. Some key parameters that are relevant to your assignment:

height: Specifies the minimum height of peaks. This can serve as a threshold to avoid detecting peaks that result from minor movements or noise.

prominence: Defines the prominence of a peak, i.e. how much it stands out from the surrounding signal, measured as the vertical distance between the peak and its lowest contour line. Requiring a higher prominence helps avoid false detections from noise.

distance: Minimum horizontal distance (in number of data points) between neighbouring peaks. It can be used to avoid detecting too many peaks in a short span of time.
When detecting steps from accelerometer data:

height and prominence can be tuned to ensure the detected peaks correspond to genuine steps rather than minor jitters or noise in the data.

distance can be adjusted based on an understanding of human walking patterns. For instance, setting the distance to half the sampling rate means that peaks closer than half a second apart are discarded, since it is unlikely for a person to take more than two steps per second during regular walking.
Tuning these parameters is crucial for accurately detecting steps without too many false positives or false negatives.
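As a quick illustration of how these three parameters interact, the snippet below runs find_peaks twice on a made-up signal; the signal and the threshold values are invented for this example and are not taken from the step logs.

import numpy as np
from scipy.signal import find_peaks

# A made-up 10-second signal sampled at 50 Hz: a 1.5 Hz "step" rhythm plus noise
t = np.linspace(0, 10, 500)
signal = np.sin(2 * np.pi * 1.5 * t) + 0.2 * np.random.randn(len(t))

# Without constraints, every local maximum (including noise) counts as a peak
all_peaks, _ = find_peaks(signal)

# With constraints, only pronounced, well-separated peaks survive
step_peaks, _ = find_peaks(
    signal,
    height=0.5,      # ignore maxima below 0.5
    prominence=0.5,  # require peaks to stand out from their surroundings
    distance=25,     # at 50 Hz, require at least half a second between peaks
)

print(len(all_peaks), "unconstrained peaks vs", len(step_peaks), "constrained peaks")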
files = glob.glob('data/Steps-Logs/*.csv')
for f in files:
    print(f)
data/Steps-Logs/D8_righthoodiepocket.csv
data/Steps-Logs/D2_leftwrist_slow.csv
data/Steps-Logs/D3_leftwrist.csv
data/Steps-Logs/D9_rightpocket_slow.csv
data/Steps-Logs/D6_leftwrist3_slow.csv
data/Steps-Logs/D5_leftwrist2_slow.csv
data/Steps-Logs/D1_lefthoodiepocket.csv
data/Steps-Logs/D4_leftwrist_3hops_3halfspin_3touchceiling_thenshake.csv
data/Steps-Logs/D7_righthoodiepocket_slow.csv
files = glob.glob('data/Steps-Logs/*.csv')
SAMPLING_RATE = 50.0 # sample rate, Hz
results = []
# set height, prominence and distance parameters
ht = 10000
prom = 0.1
dist = SAMPLING_RATE/2 # Corresponds to two steps per second, assuming it's unlikely for a person to take more than two steps every second.
for f in files:
    # Load data
    df = pd.read_csv(f, index_col='time', parse_dates=True)
    # Detect peaks
    peaks, _ = find_peaks(df['accel_mag'], height=ht, prominence=prom, distance=dist)
    num_steps = len(peaks)
    # Parse filename to extract the log ID
    match = re.search(r'D(\d+)', f)
    log_id = match.group(1)
    # Ground truth (the same hard-coded value is used for every log)
    actual_steps = 45
    # Detected steps as a percentage of the actual count
    accuracy = num_steps / actual_steps * 100
    # Store results
    results.append([log_id, actual_steps, num_steps, accuracy])
# Print table
print("{:>10} {:>10} {:>10} {:>10}".format('ID', 'Actual', 'Detected', 'Accuracy'))
for row in results:
    print("{:>10} {:>10} {:>10} {:>10.2f}".format(*row))
        ID     Actual   Detected   Accuracy
         8         45         73     162.22
         2         45         25      55.56
         3         45         59     131.11
         9         45         27      60.00
         6         45         25      55.56
         5         45         34      75.56
         1         45         84     186.67
         4         45        201     446.67
         7         45         22      48.89
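Many of the detected counts are far from the hard-coded target of 45 steps, which underlines how sensitive the result is to the parameters. One way to explore the parameter space, sketched below purely as an illustration, is a small sweep per file; the candidate prominence and distance values are assumptions, and the target of 45 steps is simply reused from the cell above.

# Sweep a few candidate prominence/distance values and report, for each file,
# the combination whose detected count is closest to the hard-coded target.
candidate_proms = [0.1, 0.5, 1.0, 2.0]
candidate_dists = [SAMPLING_RATE * 0.4, SAMPLING_RATE * 0.5, SAMPLING_RATE * 0.75]

for f in files:
    df = pd.read_csv(f, index_col='time', parse_dates=True)
    best = None
    for p in candidate_proms:
        for d in candidate_dists:
            detected = len(find_peaks(df['accel_mag'], height=ht, prominence=p, distance=d)[0])
            error = abs(detected - 45)  # 45 = the hard-coded target used above
            if best is None or error < best[0]:
                best = (error, p, d, detected)
    print(f, "-> best prominence", best[1], "distance", best[2], ":", best[3], "steps")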
# Load data and detect peaks
files_to_plot = glob.glob('data/Steps-Logs/D*.csv')
for f in files_to_plot:
    df = pd.read_csv(f, index_col='time', parse_dates=True)
    # Step counting algorithm
    peaks_indices = find_peaks(df['accel_mag'], height=ht, prominence=prom, distance=dist)[0]
    peaks = df['accel_mag'][peaks_indices]
    # Plot the signal and mark the points where the algorithm detects steps
    plt.figure(figsize=(10, 5))
    plt.plot(df.index, df['accel_mag'], 'g-', label='accel_mag')
    plt.plot(df.index[peaks_indices], peaks, 'rx', label='detected steps')
    plt.title(f)
    plt.legend()
    plt.grid()
    plt.show()
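One refinement that is not part of the algorithm above, but is worth trying if the plots show many closely spaced spurious peaks (e.g. in the D4 log with hops, spins, and shaking), is to smooth accel_mag with a short rolling mean before peak detection. The 0.2 s window below is an assumption for illustration:

# Optional refinement: smooth accel_mag before peak detection to suppress high-frequency noise.
WINDOW = int(SAMPLING_RATE * 0.2)  # assumed 0.2 s smoothing window (10 samples at 50 Hz)

for f in files:
    df = pd.read_csv(f, index_col='time', parse_dates=True)
    smoothed = df['accel_mag'].rolling(window=WINDOW, center=True, min_periods=1).mean()
    peaks, _ = find_peaks(smoothed, height=ht, prominence=prom, distance=dist)
    print(f, "->", len(peaks), "steps after smoothing")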