Data for both Part A and Part B¶
This project uses data from the Queensland Government Open Data Portal. Both parts use data on Queensland Wave Monitoring; Part B will also use data on Storm Tide Monitoring.
For this project, I will use the Coastal Data System - Near real time wave data, and for Part B I will add the Coastal Data System – Near real time storm tide data. Note that this data will change over the time period of the assignment.
[Q1] Read the data¶
- Open the CSV version of the file directly from the URL into a pandas dataframe.
- Identify an appropriate index, and make a note of the columns.
# import library
import pandas as pd
import datetime
import pytz
# url for the latest data set
url = "https://www.data.qld.gov.au/datastore/dump/2bbef99e-9974-49b9-a316-57402b00609c?bom=True"
# read the data set to the notebook with index "_id"
wave_df = pd.read_csv(url,index_col="_id")
# display the date of access
# get the current time in the local timezone
localTimezone = pytz.timezone('Australia/Brisbane')
waveRecentAccess = datetime.datetime.now(localTimezone)
print(f"The current data was accessed on {waveRecentAccess:%d-%m-%Y %H:%M}")
# get column names
wave_headings = list(wave_df.columns)
# display column names
[noRow,noCol]=wave_df.shape # spread the shape of the data frame into two variables
print(f"There are {noRow} rows in the dataframe.")
print(f"There are {noCol} columns in the dataframe, which are:")
for col in wave_headings:
    print(">", col)
The current data was accessed on 13-04-2025 22:23
There are 7504 rows in the dataframe.
There are 14 columns in the dataframe, which are:
> Site
> SiteNumber
> Seconds
> DateTime
> Latitude
> Longitude
> Hsig
> Hmax
> Tp
> Tz
> SST
> Direction
> Current Speed
> Current Direction
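One detail worth noting in the data: the Current Speed and Current Direction columns show -99.9, which looks like a missing-data placeholder rather than a real reading (an assumption on my part, not stated in the dataset description). A minimal sketch, on a hypothetical miniature frame, of converting such sentinels to NaN so that later aggregates ignore them:

```python
import numpy as np
import pandas as pd

# Hypothetical mini-frame mirroring the sentinel convention seen above,
# where -99.9 is assumed to mark a missing reading
df = pd.DataFrame({
    "Hsig": [0.714, 0.716],
    "Current Speed": [-99.9, 0.3],
})
# Replace the sentinel with NaN so aggregates like max() skip it
df = df.replace(-99.9, np.nan)
print(df["Current Speed"].isna().sum())  # → 1
```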
[Q2] Save the data¶
- Transform the grouped data into a dataframe
- Save the dataframe as a CSV file with the date that reflects the URL access in Q1
# save the data retrieved from the internet
import os
path = "data/"
os.makedirs(path, exist_ok=True)  # create the folder if it does not already exist
# format the timestamp so the filename contains no colons or spaces
file_name_recent = f'wave_data({waveRecentAccess:%d-%m-%Y_%H-%M}).csv'
wave_df.to_csv(f'{path}{file_name_recent}')
Read the data from a file¶
- To read the same data back in (rather than up-to-date data), write code here to read in the file from Q2
# Read the data locally with index "_id"
wave_file_df = pd.read_csv(f"{path}{file_name_recent}",index_col="_id")
wave_file_df
| | Site | SiteNumber | Seconds | DateTime | Latitude | Longitude | Hsig | Hmax | Tp | Tz | SST | Direction | Current Speed | Current Direction |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| _id | ||||||||||||||
| 1 | Caloundra | 54 | 1743861600 | 2025-04-06T00:00:00 | -26.84675 | 153.15581 | 0.714 | 1.14 | 6.67 | 5.479 | 25.25 | 85.80 | -99.9 | -99.9 |
| 2 | Caloundra | 54 | 1743863400 | 2025-04-06T00:30:00 | -26.84688 | 153.15564 | 0.716 | 1.23 | 6.67 | 5.479 | 25.25 | 81.60 | -99.9 | -99.9 |
| 3 | Caloundra | 54 | 1743865200 | 2025-04-06T01:00:00 | -26.84700 | 153.15555 | 0.677 | 1.20 | 6.67 | 5.634 | 25.15 | 83.00 | -99.9 | -99.9 |
| 4 | Caloundra | 54 | 1743867000 | 2025-04-06T01:30:00 | -26.84697 | 153.15549 | 0.717 | 1.29 | 6.67 | 5.797 | 25.15 | 87.20 | -99.9 | -99.9 |
| 5 | Caloundra | 54 | 1743868800 | 2025-04-06T02:00:00 | -26.84699 | 153.15553 | 0.708 | 1.10 | 6.67 | 5.714 | 25.20 | 87.20 | -99.9 | -99.9 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 7500 | Hay Point TriAxys | 4740tx | 1744537200 | 2025-04-13 19:40:00 | -21.27830 | 149.32270 | 1.860 | 2.91 | 5.60 | 4.800 | 26.50 | 119.26 | -99.9 | -99.9 |
| 7501 | Hay Point TriAxys | 4740tx | 1744538400 | 2025-04-13 20:00:00 | -21.27830 | 149.32270 | 1.940 | 3.15 | 5.90 | 5.000 | 26.48 | 122.26 | -99.9 | -99.9 |
| 7502 | Hay Point TriAxys | 4740tx | 1744539600 | 2025-04-13 20:20:00 | -21.27830 | 149.32260 | 1.900 | 3.04 | 5.90 | 5.000 | 26.47 | 114.26 | -99.9 | -99.9 |
| 7503 | Hay Point TriAxys | 4740tx | 1744540800 | 2025-04-13 20:40:00 | -21.27830 | 149.32260 | 1.890 | 3.21 | 6.20 | 5.200 | 26.45 | 115.26 | -99.9 | -99.9 |
| 7504 | Hay Point TriAxys | 4740tx | 1744542000 | 2025-04-13 21:00:00 | -21.27820 | 149.32250 | 1.930 | 3.51 | 5.90 | 4.900 | 26.44 | 114.26 | -99.9 | -99.9 |
7504 rows × 14 columns
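As an optional sanity check (not required by the brief), pandas' testing helper can confirm that a CSV round trip preserves the data. A minimal sketch using an in-memory buffer in place of the file from Q2; `original` is a toy stand-in for `wave_df`:

```python
import io
import pandas as pd

# Toy frame standing in for wave_df; the real check would compare
# wave_df against wave_file_df as read back above
original = pd.DataFrame({"_id": [1, 2], "Hsig": [0.714, 0.716]}).set_index("_id")
buffer = io.StringIO()
original.to_csv(buffer)
buffer.seek(0)
roundtrip = pd.read_csv(buffer, index_col="_id")
# Raises AssertionError if values, dtypes, or the index differ
pd.testing.assert_frame_equal(original, roundtrip)
print("round trip OK")
```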
[Q3] Analyse the data¶
- Filter the data to include only sites for the South East coast (from Gold Coast to Sunshine Coast)
- Group the filtered data by site
- Obtain an appropriate aggregate for the groups (e.g. Sum, Mean, etc)
- Save the grouped data as a new dataframe
Correct the data format¶
The "DateTime" column is converted from string to a "datetime object" for easy manipulation.
wave_file_df['DateTime'] = pd.to_datetime(wave_file_df['DateTime'], errors='coerce')
print(wave_file_df.dtypes)
Site                         object
SiteNumber                   object
Seconds                       int64
DateTime             datetime64[ns]
Latitude                    float64
Longitude                   float64
Hsig                        float64
Hmax                        float64
Tp                          float64
Tz                          float64
SST                         float64
Direction                   float64
Current Speed               float64
Current Direction           float64
dtype: object
Correct the name of sites¶
Some site names include the buoy unit name, e.g. "Mk4". The unit name is technical information that is not important for the analysis, so it is removed to avoid misunderstanding.
wave_file_df['Site'] = wave_file_df['Site'].str.replace('Mk4','').str.rstrip()
print("> new set of site names:",set(wave_file_df["Site"]))
> new set of site names: {'Wide Bay', 'Gladstone', 'Cairns', 'Caloundra', 'Brisbane', 'Gold Coast', 'Emu Park', 'Tweed Heads', 'Townsville', 'Palm Beach', 'Mackay', 'Poruma West', 'Mooloolaba', 'Albatross Bay', 'Tweed Offshore', 'North Moreton Bay', 'Hay Point TriAxys', 'Bundaberg', 'Skardon River Outer', 'Bilinga'}
Filter data¶
Retrieve Significant Wave Height and Average Zero Upcrossing Wave Period – The dataset contains 14 columns, but only Significant Wave Height (Hsig) and Average Zero Upcrossing Wave Period (Tz) are needed to answer the questions, as together they indicate the wave energy.
Significant Wave Height is used instead of Maximum Wave Height (Hmax) because it is more representative. Hsig records the mean height of the highest one-third of waves, so it represents waves higher than the most frequent waves (Bureau of Meteorology, 2015). Hmax, in contrast, records only the single highest wave, which may introduce extreme values that rarely occur; relying on it would make the analysis overly sensitive and reduce the system's credibility. Hsig therefore gives a more general measure for the analysis. For the same reason, the average zero upcrossing wave period (Tz) is used instead of the peak wave period (Tp).
Filter to include only South East coast data – To keep the study focused, only monitoring sites along the South East coast, from Mooloolaba in the north to Tweed Offshore in the south, are included. The data are filtered by latitude: only rows with a latitude smaller than -26.56° (just north of Mooloolaba) are retained.
# Filtering data
wave_SEQ_df=wave_file_df[wave_file_df["Latitude"]<-26.56]
wave_SEQ_df = wave_SEQ_df[['Site','DateTime','Hsig', 'Tz','Longitude', 'Latitude']]
wave_SEQ_df
| | Site | DateTime | Hsig | Tz | Longitude | Latitude |
|---|---|---|---|---|---|---|
| _id | ||||||
| 1 | Caloundra | 2025-04-06 00:00:00 | 0.714 | 5.479 | 153.15581 | -26.84675 |
| 2 | Caloundra | 2025-04-06 00:30:00 | 0.716 | 5.479 | 153.15564 | -26.84688 |
| 3 | Caloundra | 2025-04-06 01:00:00 | 0.677 | 5.634 | 153.15555 | -26.84700 |
| 4 | Caloundra | 2025-04-06 01:30:00 | 0.717 | 5.797 | 153.15549 | -26.84697 |
| 5 | Caloundra | 2025-04-06 02:00:00 | 0.708 | 5.714 | 153.15553 | -26.84699 |
| ... | ... | ... | ... | ... | ... | ... |
| 6558 | Bilinga | 2025-04-13 18:30:00 | 1.590 | 5.770 | 153.51279 | -28.14245 |
| 6559 | Bilinga | 2025-04-13 19:00:00 | 1.730 | 6.190 | 153.51281 | -28.14244 |
| 6560 | Bilinga | 2025-04-13 19:30:00 | 1.810 | 6.540 | 153.51277 | -28.14196 |
| 6561 | Bilinga | 2025-04-13 20:00:00 | 1.720 | 6.160 | 153.51281 | -28.14193 |
| 6562 | Bilinga | 2025-04-13 20:30:00 | 1.950 | 6.170 | 153.51279 | -28.14193 |
3383 rows × 6 columns
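A small defensive check (my own addition, not part of the brief) can guard the latitude cut-off: any site well north of -26.56°, such as Cairns, must not survive the filter. A sketch on a hypothetical miniature frame mimicking the Site and Latitude columns:

```python
import pandas as pd

# Hypothetical mini-frame with one far-northern site included
df = pd.DataFrame({
    "Site": ["Mooloolaba", "Caloundra", "Cairns"],
    "Latitude": [-26.56684, -26.84675, -16.73],
})
seq = df[df["Latitude"] < -26.56]
# Cairns lies far north of the cut-off, so it must be excluded
assert "Cairns" not in set(seq["Site"])
print(sorted(set(seq["Site"])))  # → ['Caloundra', 'Mooloolaba']
```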
Sort data¶
Sort data by latitude – The data are originally sorted alphabetically by monitoring-site name. To make the ordering more meaningful, the data are sorted by timestamp and then by latitude in descending order, which arranges the sites from north to south within each observation time.
# Sorting data
# copy the filtered slice to avoid pandas' SettingWithCopyWarning
wave_SEQ_df = wave_SEQ_df.copy()
# sort by timestamp first, then from north to south (descending latitude)
wave_SEQ_df = wave_SEQ_df.sort_values(by=["DateTime", "Latitude"], ascending=[True, False])
wave_SEQ_df
| | Site | DateTime | Hsig | Tz | Longitude | Latitude |
|---|---|---|---|---|---|---|
| _id | ||||||
| 746 | Mooloolaba | 2025-04-06 00:00:00 | 1.044 | 5.797 | 153.18452 | -26.56684 |
| 1 | Caloundra | 2025-04-06 00:00:00 | 0.714 | 5.479 | 153.15581 | -26.84675 |
| 375 | North Moreton Bay | 2025-04-06 00:00:00 | 0.754 | 5.333 | 153.28159 | -26.90002 |
| 4818 | Brisbane | 2025-04-06 00:00:00 | 1.070 | 5.270 | 153.63188 | -27.48649 |
| 5194 | Gold Coast | 2025-04-06 00:00:00 | 0.980 | 6.090 | 153.43906 | -27.96435 |
| ... | ... | ... | ... | ... | ... | ... |
| 4817 | Palm Beach | 2025-04-13 20:00:00 | 2.030 | 5.770 | 153.48567 | -28.09926 |
| 6561 | Bilinga | 2025-04-13 20:00:00 | 1.720 | 6.160 | 153.51281 | -28.14193 |
| 4103 | Tweed Heads | 2025-04-13 20:00:00 | 2.410 | 6.130 | 153.57637 | -28.17828 |
| 5571 | Gold Coast | 2025-04-13 20:30:00 | 2.330 | 5.840 | 153.43921 | -27.96417 |
| 6562 | Bilinga | 2025-04-13 20:30:00 | 1.950 | 6.170 | 153.51279 | -28.14193 |
3383 rows × 6 columns
Group the filtered data¶
- By monitoring site – Wave characteristics may differ by location, so the data for each site should be analysed separately. To facilitate comparisons within sites, the data are grouped by monitoring site.
- By date – The data are recorded every 20–30 minutes. To keep the data manageable, they are also grouped by date.
Obtain appropriate aggregates for the groups¶
- Daily maximum Hsig and Tz – The daily maximum Hsig and Tz are calculated to summarise the wave conditions at each monitoring site. These maxima represent the highest values observed each day, which is useful for safety considerations and for understanding peak wave activity. Note that they are derived from Hsig and Tz rather than Hmax and Tp, because Hmax and Tp capture extreme cases that rarely occur, whereas Hsig, as the mean of the highest one-third of waves, gives a general measure of conditions. Taking the daily maximum of Hsig and Tz therefore captures the strongest commonly occurring waves while avoiding the influence of extremes.
# Grouping the filtered data and obtaining daily maximum Hsig and Tz
wave_SEQ_group_max_df = wave_SEQ_df.groupby(
    ["Site", wave_SEQ_df['DateTime'].dt.date], sort=False
).agg({'Hsig': 'max', 'Tz': 'max', 'Longitude': 'first', 'Latitude': 'first'})
wave_SEQ_group_max_df = wave_SEQ_group_max_df.reset_index(names=['Site','DateTime'])
wave_SEQ_group_max_df
| | Site | DateTime | Hsig | Tz | Longitude | Latitude |
|---|---|---|---|---|---|---|
| 0 | Mooloolaba | 2025-04-06 | 1.329 | 6.250 | 153.18452 | -26.56684 |
| 1 | Caloundra | 2025-04-06 | 0.891 | 5.970 | 153.15581 | -26.84675 |
| 2 | North Moreton Bay | 2025-04-06 | 1.053 | 5.797 | 153.28159 | -26.90002 |
| 3 | Brisbane | 2025-04-06 | 1.740 | 6.950 | 153.63188 | -27.48649 |
| 4 | Gold Coast | 2025-04-06 | 1.190 | 7.210 | 153.43906 | -27.96435 |
| ... | ... | ... | ... | ... | ... | ... |
| 67 | Gold Coast | 2025-04-13 | 2.550 | 5.960 | 153.43906 | -27.96420 |
| 68 | Palm Beach | 2025-04-13 | 2.430 | 6.040 | 153.48579 | -28.09923 |
| 69 | Bilinga | 2025-04-13 | 2.190 | 6.540 | 153.51283 | -28.14198 |
| 70 | Tweed Heads | 2025-04-13 | 2.560 | 6.260 | 153.57632 | -28.17834 |
| 71 | Tweed Offshore | 2025-04-13 | 3.040 | 6.570 | 153.68205 | -28.21257 |
72 rows × 6 columns
[Q4] Visualise the data¶
- Visualise the grouped data with an appropriate chart
- Ensure X and Y axes are labelled appropriately
- Add an appropriate title for the chart
Daily maximum Hsig and Tz trends across sites¶
To analyse the temporal trends of wave conditions, two line charts display the daily maximum Hsig and Tz across the monitoring sites. Since the data form a time series, a line chart captures changes over time well.
From these two charts, Hsig and Tz can be compared among sites. Each monitoring site is drawn in a different colour to make the wave trends easier to compare across locations.
import plotly.express as px
# the range of data
startDate=min(wave_SEQ_group_max_df["DateTime"])
endDate=max(wave_SEQ_group_max_df["DateTime"])
dateRange=f"{startDate} to {endDate}"
# significant wave height across time
lineChartHsig = px.line(
wave_SEQ_group_max_df,
x="DateTime",
y="Hsig",
color="Site",
title=f"Figure 1: Daily maximum significant wave height <br> of South East Queensland: {dateRange}",
    labels={"DateTime": "Date", "Hsig": "Daily maximum significant wave height (m)"},
width=750,
height=500
)
lineChartHsig.show()
# zero upcrossing wave period across time
lineChartTz = px.line(
wave_SEQ_group_max_df,
x="DateTime",
y="Tz",
color="Site",
title=f"Figure 2: Daily maximum average zero upcrossing wave period <br> of South East Queensland: {dateRange}",
    labels={"DateTime": "Date", "Tz": "Daily maximum zero upcrossing wave period (s)"},
width=750,
height=500
)
lineChartTz.show()