add validated walker

joshuabmoore · joshuabmoore · commit 6b0f15a1b8a8 · 2025-07-18T12:48:23.000+10:00
diff --git a/README.md b/README.md
@@ -12,7 +12,7 @@ __11/07:__ 587 partialed functions, 2488 validated features
 
 __13/07:__ 623 partialed functions, 2673 validated features
 
-__18/07:__ 660 partialed functions, 2876 validated features
+__18/07:__ 660 partialed functions, 3044 validated features
 
 # Feature Conversion Progress...
-![](https://geps.dev/progress/41)
+![](https://geps.dev/progress/43)
diff --git a/pyhctsa/Configurations/basic.yaml b/pyhctsa/Configurations/basic.yaml
@@ -1494,4 +1494,22 @@ Physics:
         zscore: True
     hctsa_name: PH_ForcePotential
     ordered_args: ['whatPotential', 'params']
-    
+
+  Walker:
+    base_name: Walker
+    labels:
+      - physics
+      - dynamicalSystem
+    dependencies:
+    configs:
+      - walkerRule: 'prop'
+        walkerParams: [0.1, 0.5, 0.9, 1.1] 
+        zscore: True
+      - walkerRule: 'biasprop'
+        walkerParams: [[0.5, 0.1], [0.1, 0.5]] 
+        zscore: True
+      - walkerRule: 'momentum'
+        walkerParams: [2, 5]
+        zscore: True
+    hctsa_name: PH_Walker
+    ordered_args: ["walkerRule", "walkerParams"]
diff --git a/pyhctsa/Configurations/physics.yaml b/pyhctsa/Configurations/physics.yaml
@@ -13,4 +13,23 @@ Physics:
         params: [[3,0.5,1], [1,1,1], [10,0.04,10]]
         zscore: True
     hctsa_name: PH_ForcePotential
-    ordered_args: ['whatPotential', 'params']
+    ordered_args: ['whatPotential', 'params']
+  
+  Walker:
+    base_name: Walker
+    labels:
+      - physics
+      - dynamicalSystem
+    dependencies:
+    configs:
+      - walkerRule: 'prop'
+        walkerParams: [0.1, 0.5, 0.9, 1.1] 
+        zscore: True
+      - walkerRule: 'biasprop'
+        walkerParams: [[0.5, 0.1], [0.1, 0.5]] 
+        zscore: True
+      - walkerRule: 'momentum'
+        walkerParams: [2, 5]
+        zscore: True
+    hctsa_name: PH_Walker
+    ordered_args: ["walkerRule", "walkerParams"]
diff --git a/pyhctsa/Operations/Physics.py b/pyhctsa/Operations/Physics.py
@@ -2,6 +2,142 @@
 from typing import Union
 from numpy.typing import ArrayLike
 from pyhctsa.Operations.Correlation import FirstCrossing, AutoCorr
+from pyhctsa.Operations.Stationarity import SlidingWindow
+from scipy.stats import ansari, gaussian_kde
+from statsmodels.sandbox.stats.runs import runstest_1samp
+
+
+def Walker(y : ArrayLike, walkerRule : str = 'prop', walkerParams : Union[None, float, int, list] = None) -> dict:
+    """
+    Simulates a hypothetical walker moving through the time domain.
+
+    Note: due to differences in how the kde is implemented, exepct a discrepancy in the 
+    `sw_distdiff` feature.
+    """
+    N = len(y)
+
+    # Define default values and type requirements for each rule
+    WALKER_CONFIGS = {
+        'prop': {
+            'default': 0.5,
+            'valid_types': (int, float),
+            'error_msg': 'must be float or integer'
+        },
+        'biasprop': {
+            'default': [0.1, 0.2],
+            'valid_types': (list,),
+            'error_msg': 'must be a list'
+        },
+        'momentum': {
+            'default': 2,
+            'valid_types': (int, float),
+            'error_msg': 'must be float or integer'
+        }
+    }
+
+    if walkerRule not in WALKER_CONFIGS:
+        valid_rules = ", ".join(f"'{rule}'" for rule in WALKER_CONFIGS.keys())
+        raise ValueError(f"Unknown walker_rule: '{walkerRule}'. Choose from: {valid_rules}")
+    
+    # get configuration for the specified rule
+    config = WALKER_CONFIGS[walkerRule]
+
+    # use the default value if no parameters provided
+    if walkerParams is None:
+        walkerParams = config['default']
+
+    if not isinstance(walkerParams, config["valid_types"]):
+        raise ValueError(
+            f"walkerParams {config['error_msg']} for walker rule: '{walkerRule}'"
+        )
+    
+    # Do the walk
+    w = np.zeros(N)
+
+    if walkerRule == 'prop':
+        #  % walker starts at zero and narrows the gap between its position
+        #and the time series value at that point by the proportion given
+        #in walkerParams, to give the value at the subsequent time step
+        p = walkerParams
+        w[0] = 0 # start at zero
+        for i in range(1, N):
+            w[i] = w[i-1] + p * (y[i-1] - w[i-1])
+        
+    elif walkerRule == 'biasprop':
+        #walker is biased in one or the other direction (i.e., prefers to
+        # go up, or down). Requires a vector of inputs: [p_up, p_down]
+        pup, pdown = walkerParams
+
+        w[0] = 0
+        for i in range(1, N):
+            if y[i] > y[i-1]: # time series inceases
+                w[i] = w[i-1] + pup*(y[i-1]-w[i-1])
+            else:
+                w[i] = w[i-1] + pdown*(y[i-1]-w[i-1])
+    elif walkerRule == 'momentum':
+        #  % walker moves as if it had inertia from the previous time step,
+        # i.e., it 'wants' to move the same amount; the time series acts as
+        # a force changing its motion
+        m = walkerParams # 'inertial mass'
+
+        w[0] = y[0]
+        w[1] = y[1]
+        for i in range(2, N):
+            w_inert = w[i-1] + (w[i-1]-w[i-2])
+            w[i] = w_inert + (y[i]-w_inert)/m # dissipative term
+            #  % equation of motion (s-s_0=ut+F/m*t^2)
+            # where the 'force' F is the change in the original time series
+            # at that point
+    else:
+        raise ValueError(f"Unknown rule : {walkerRule}")
+    
+    # Get statistics on the walk
+    out = {}
+    # the walk itself
+    out['w_mean'] = np.mean(w)
+    out['w_median'] = np.median(w)
+    out['w_std'] = np.std(w, ddof=1)
+    out['w_ac1'] = AutoCorr(w, 1, 'Fourier')[0] # lag 1 autocorr
+    out['w_ac2'] = AutoCorr(w, 2, 'Fourier')[0] # lag 2 autocorr
+    out['w_tau'] = FirstCrossing(w, 'ac', 0, 'continuous')
+    out['w_min'] = np.min(w)
+    out['w_max'] = np.max(w)
+    # fraction of time series length that walker crosses time series
+    out['w_propzcross'] = (np.sum((w[:-1] * w[1:]) < 0)) / (N-1)
+
+    # Differences between the walk at signal
+    out['sw_meanabsdiff'] = np.mean(np.abs(y - w))
+    out['sw_taudiff'] = FirstCrossing(y, 'ac', 0, 'continuous') - FirstCrossing(w, 'ac', 0 , 'continuous')
+    out['sw_stdrat'] =  np.std(w, ddof=1)/np.std(y, ddof=1)
+    out['sw_ac1rat'] = out['w_ac1']/AutoCorr(y, 1)[0]
+    out['sw_minrat'] = np.min(w)/np.min(y)
+    out['sw_maxrat'] = np.max(w)/np.max(y)
+    out['sw_propcross'] = np.sum((w[:-1] - y[:-1]) * (w[1:] - y[1:]) < 0)/(N-1)
+
+    #% test from same distribution: Ansari-Bradley test
+    _, pval = ansari(w, y)
+    out['sw_ansarib_pval'] = pval
+
+    r = np.linspace(
+        min(min(y), min(w)),
+        max(max(y), max(w)),
+        200
+    )
+
+    kde_y = gaussian_kde(y)
+    kde_w = gaussian_kde(w)
+    dy = kde_y(r)
+    dw = kde_w(r)
+    out['sw_distdiff'] = np.sum(np.abs(dy - dw))
+
+    #% (iii) Looking at residuals between time series and walker
+    res = w - y
+    _, runs_pval = runstest_1samp(res, cutoff='mean')
+    out['res_runstest'] = runs_pval
+    out['res_swss5_1'] = SlidingWindow(res, 'std', 'std', 5, 1) # sliding window stationarity
+    out['res_ac1'] = AutoCorr(res, 1)[0] # auto correlation at lag-1
+
+    return out
 
 
 def ForcePotential(y : ArrayLike, whatPotential : str = 'dblwell', params : Union[list, None] = None) -> dict: