import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from scipy.optimize import curve_fit
from scipy.signal import correlate
from scipy.fft import fft

# Load the Whitby tide-gauge record into a DataFrame with columns
# `time` (hours elapsed since `t0`), `level` and `residual`.
data_dir = '../data/misc'
data = []
i = 0  # NOTE(review): not used anywhere in the visible code; kept in case a later cell reads it
t0 = pd.Timestamp('2023-01-01 00:00:00').timestamp()

with open(f'{data_dir}/whitby_tides.txt') as f:
    lines = f.readlines()

# The first 11 lines are skipped (presumably the file header); the remaining
# lines are read as fixed-width records: characters 8-26 hold the timestamp,
# 28-36 the tide level and 38-47 the residual.
for line in lines[11:]:
    if not line.strip():
        continue  # Skip any empty lines
    try:
        time = (pd.Timestamp(line[8:27]).timestamp() - t0) / 3600
    except (ValueError, TypeError, OverflowError):
        # Skip any lines that do not have a valid time. Only parse failures
        # are caught, so Ctrl-C / SystemExit are no longer swallowed.
        continue
    level = float(line[28:37])
    residual = float(line[38:48])
    if level <= -99:
        # Missing is indicated by a tide level of -99; skip these lines
        continue
    data.append([time, level, residual])

df = pd.DataFrame(data, columns=['time', 'level', 'residual'])
df

def plot_days(start_day, end_day, values = None, ax = None):
    """Plot a series against time for the days ``start_day``..``end_day``.

    Times are taken from the module-level ``df['time']`` column (in hours),
    so day ``d`` starts at hour ``24 * d``. Both ends of the window are
    inclusive, and a dashed red vertical line marks every day boundary in it.

    Parameters
    ----------
    start_day, end_day : int
        First and last day to show. They are passed to ``range``, so they
        must be integers.
    values : optional
        Series to plot; it is indexed with a boolean mask built from
        ``df['time']``. Defaults to ``df['level']``.
    ax : optional
        Axes to draw on. A new 15x6 figure is created when omitted.
    """
    first_hour, last_hour = start_day * 24, end_day * 24
    if values is None:
        values = df['level']
    if ax is None:
        _, ax = plt.subplots(figsize=(15, 6))

    hours = df['time']
    in_window = hours.between(first_hour, last_hour)  # inclusive on both ends
    ax.plot(hours[in_window], values[in_window])

    # One marker per day boundary, including both ends of the window.
    for day in range(start_day, end_day + 1):
        ax.axvline(x=day * 24, color='r', linestyle='--')

    ax.set_xlabel('Time (hours)')
    ax.set_ylabel('Tide level')

# Show the recorded tide level for days 100 to 110, with a dashed red line at
# each day boundary.
plot_days(100,110)

# Periods, in hours, of the tidal harmonic constituents used in the fit
# (Darwin symbol first).
tau = [
    12.4206012,    # M2  - principal lunar semidiurnal
    12,            # S2  - principal solar semidiurnal
    12.65834751,   # N2  - larger lunar elliptic semidiurnal
    23.93447213,   # K1  - lunisolar diurnal
    6.210300601,   # M4  - shallow-water overtide of principal lunar
    25.81933871,   # O1  - lunar diurnal
    4.140200401,   # M6  - shallow-water overtide of principal lunar
    8.177140247,   # MK3 - shallow-water terdiurnal
    6,             # S4  - shallow-water overtide of principal solar
]

# Angular frequency (radians per hour) of each constituent.
omega = (2 * np.pi) / np.asarray(tau)

# Initial guess for the fit: one constant term plus a cosine and a sine
# coefficient per constituent, all starting at zero.
a0 = np.zeros(2 * omega.size + 1)

def p_short(t, *a):
    """Evaluate the harmonic tide model at time(s) ``t``.

    The model is ``a[0] + sum_k (a[2k+1] * cos(omega[k] * t)
    + a[2k+2] * sin(omega[k] * t))``, with the frequencies taken from the
    module-level ``omega`` array.

    Parameters
    ----------
    t : scalar or array-like
        Time(s) at which to evaluate. A trailing axis is added so that ``t``
        broadcasts against ``omega``, and is summed away again.
    *a : float
        ``a[0]`` is the constant term; odd positions are the cosine
        coefficients and even positions (from 2) the sine coefficients.
    """
    coeffs = np.asarray(a)
    cos_weights, sin_weights = coeffs[1::2], coeffs[2::2]
    angle = omega * np.expand_dims(t, -1)  # shape (..., number of frequencies)
    cos_part = (cos_weights * np.cos(angle)).sum(axis=-1)
    sin_part = (sin_weights * np.sin(angle)).sum(axis=-1)
    return a[0] + cos_part + sin_part

def p_long(t, a0, a1, a2, a3, a4, a5, a6, a7, a8, a9, a10, a11, a12, a13, a14, a15, a16, a17, a18):
    """Harmonic tide model written with one explicit parameter per coefficient.

    Computes ``a0 + sum_k (a[2k+1] * cos(omega[k] * t)
    + a[2k+2] * sin(omega[k] * t))`` for the first nine entries of the
    module-level ``omega`` array.

    Parameters
    ----------
    t : scalar or array
        Time(s) at which to evaluate the model.
    a0 : float
        Constant term (this parameter shadows the module-level ``a0``).
    a1 .. a18 : float
        Alternating cosine (odd index) and sine (even index) coefficients,
        one pair per frequency.
    """
    cos_weights = (a1, a3, a5, a7, a9, a11, a13, a15, a17)
    sin_weights = (a2, a4, a6, a8, a10, a12, a14, a16, a18)

    # Accumulate the terms left to right: constant, then cos/sin of each
    # frequency in turn.
    total = a0
    for k, (c, s) in enumerate(zip(cos_weights, sin_weights)):
        total = total + c * np.cos(omega[k] * t) + s * np.sin(omega[k] * t)
    return total

# Fit the harmonic model to the observed tide levels.
# `p` selects the model function; p_short uses a constant plus one
# cosine/sine coefficient pair per frequency.
p = p_short

ts = df['time'].to_numpy()
ys = df['level'].to_numpy()
# With full_output=True curve_fit returns a tuple whose first element is the
# array of optimal parameters; only that element is used below.
fit = curve_fit(p, ts, ys, p0 = a0, xtol=1e-11, maxfev=10000, full_output=True)
aa = fit[0]
print(f"Optimal constant: {aa[0]}")
# For p_short the odd-indexed parameters multiply cos(omega * t) and the
# even-indexed ones multiply sin(omega * t); they are not amplitudes/phases.
print(f"Optimal cosine coefficients: {aa[1::2]}")
print(f"Optimal sine coefficients: {aa[2::2]}")
# Model prediction at every observation time, for comparison with `ys`.
zs = p(ts, *aa)

Optimal constant: 3.5421270902565114
Optimal amplitudes: [ 1.19256096e+00 -4.73221830e-01  2.97558451e-01 -6.00008931e-02
 -2.15307734e-02  1.02415961e-01  1.30216449e-03 -1.12941008e-03
 -5.97073492e-03]
Optimal phases: [-1.07817045  0.30676206  0.10903037 -0.12935731  0.01330247 -0.1286847
 -0.01046758  0.01039158  0.0015952 ]

# Compare observation (blue) and fitted model (red) over the samples with
# index N0 up to, but not including, N1.
N0, N1 = 8000, 12000
sample_window = slice(N0, N1)
fig, ax = plt.subplots(figsize=(15, 6))
ax.plot(ts[sample_window], ys[sample_window], color='blue')
ax.plot(ts[sample_window], zs[sample_window], color='red')

[<matplotlib.lines.Line2D at 0x2a5119b9810>]

def p_phase(t, *a):
    """Evaluate the tide model in amplitude/phase form at time(s) ``t``.

    The model is ``a[0] + sum_k a[2k+1] * sin(omega[k] * t + a[2k+2])``,
    with the frequencies taken from the module-level ``omega`` array.

    Parameters
    ----------
    t : scalar or array-like
        Time(s) at which to evaluate. A trailing axis is added so that ``t``
        broadcasts against ``omega``, and is summed away again.
    *a : float
        ``a[0]`` is the constant term; odd positions are amplitudes and even
        positions (from 2) the matching phase offsets.
    """
    params = np.asarray(a)
    offset, amplitudes, phases = params[0], params[1::2], params[2::2]
    angle = omega * np.expand_dims(t, -1) + phases
    return (amplitudes * np.sin(angle)).sum(axis=-1) + offset

	time	level	residual
0	0.00	5.036	0.365
1	0.25	4.919	0.357
2	0.50	4.810	0.373
3	0.75	4.662	0.364
4	1.00	4.506	0.357
...	...	...	...
34937	8758.75	3.069	0.434
34938	8759.00	2.880	0.439
34939	8759.25	2.719	0.461
34940	8759.50	2.547	0.459
34941	8759.75	2.404	0.468

Whitby tides