{ "cells": [ { "cell_type": "code", "execution_count": 13, "id": "52701550-0bda-4fa4-959f-2b42eb42e140", "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 14, "id": "8cb2dd41-79e1-45bf-a0eb-ff9abc0baa8b", "metadata": {}, "outputs": [], "source": [ "df = pd.read_csv(\"cleaned_data_with_categories.csv\")" ] }, { "cell_type": "code", "execution_count": 15, "id": "c4e79890-de47-4774-9445-142cff46cf86", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | id | \n", "Headline | \n", "Summary | \n", "Severity | \n", "Category | \n", "Region | \n", "Datetime | \n", "Year | \n", "lat | \n", "lon | \n", "URL | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "3 | \n", "Shanghai port congestion impacts terminals in ... | \n", "The persisting port congestion at Shanghai’s... | \n", "Minor | \n", "Maritime Advisory | \n", "China | \n", "27/4/17 9:16 | \n", "2017 | \n", "29.52000 | \n", "121.33190 | \n", "NaN | \n", "
1 | \n", "17 | \n", "24 hour pier hold in effect at Port of Durban | \n", "Industry sources indicate on August 31 that th... | \n", "Minor | \n", "Port Congestion | \n", "South Africa | \n", "31/8/18 18:07 | \n", "2018 | \n", "-29.86875 | \n", "31.03305 | \n", "NaN | \n", "
2 | \n", "1599 | \n", "Heavy congestion reported at Port of Houston | \n", "According to sources on March 20, heavy conges... | \n", "Moderate | \n", "Port Congestion | \n", "United States | \n", "20/3/19 12:43 | \n", "2019 | \n", "29.60949 | \n", "-95.00567 | \n", "NaN | \n", "
3 | \n", "1600 | \n", "Heavy congestion reported at Port of Long Beach | \n", "According to sources on January 7, heavy conge... | \n", "Severe | \n", "Port Congestion | \n", "United States | \n", "7/1/19 9:50 | \n", "2019 | \n", "33.75448 | \n", "-118.21663 | \n", "NaN | \n", "
4 | \n", "1613 | \n", "High risk of pilot suspension reported at Port... | \n", "On December 31, shipping sources indicate that... | \n", "Minor | \n", "Severe Winds | \n", "Japan | \n", "31/12/19 10:23 | \n", "2019 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
100 | \n", "3756 | \n", "Magnitude 5.1 earthquake reported 12 kilometer... | \n", "The United States Geological Survey has confir... | \n", "Moderate | \n", "Earthquake | \n", "Japan | \n", "25/9/20 17:35 | \n", "2020 | \n", "33.12568 | \n", "139.80898 | \n", "NaN | \n", "
101 | \n", "3757 | \n", "Magnitude 5.2 earthquake recorded 30 kilometer... | \n", "The United States Geological Survey (USGS) has... | \n", "Moderate | \n", "Earthquake | \n", "Philippines | \n", "6/1/20 8:03 | \n", "2020 | \n", "5.41372 | \n", "125.40147 | \n", "NaN | \n", "
102 | \n", "3758 | \n", "Magnitude 5.3 earthquake reported 17 km west o... | \n", "The United States Geological Survey (USGS) has... | \n", "Moderate | \n", "Earthquake | \n", "Philippines | \n", "9/5/20 20:09 | \n", "2020 | \n", "14.06667 | \n", "120.63333 | \n", "NaN | \n", "
103 | \n", "3759 | \n", "Magnitude 6.2 earthquake reported north of Sur... | \n", "The US Geological Survey is reporting that a m... | \n", "Severe | \n", "Earthquake | \n", "Indonesia | \n", "5/2/20 19:37 | \n", "2020 | \n", "-6.23324 | \n", "112.93235 | \n", "NaN | \n", "
104 | \n", "5715 | \n", "USGS reports magnitude 6.3 earthquake 4km sout... | \n", "The United States Geological Survey (USGS) has... | \n", "Severe | \n", "Earthquake | \n", "Philippines | \n", "25/12/20 0:25 | \n", "2020 | \n", "13.83333 | \n", "120.63330 | \n", "NaN | \n", "
105 rows × 11 columns
\n", "\n", " | id | \n", "Headline | \n", "Summary | \n", "Severity | \n", "Region | \n", "Datetime | \n", "Year | \n", "lat | \n", "lon | \n", "URL | \n", "
---|---|---|---|---|---|---|---|---|---|---|
Category | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
Maritime Advisory | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "13 | \n", "13 | \n", "0 | \n", "
Earthquake | \n", "18 | \n", "18 | \n", "18 | \n", "17 | \n", "18 | \n", "18 | \n", "18 | \n", "14 | \n", "14 | \n", "0 | \n", "
Port Congestion | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "11 | \n", "11 | \n", "0 | \n", "
Severe Winds | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "3 | \n", "3 | \n", "0 | \n", "
Port Disruption | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "4 | \n", "4 | \n", "0 | \n", "
Port Closure | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "2 | \n", "2 | \n", "0 | \n", "
Miscellaneous Strikes | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "0 | \n", "
Maritime Accident | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "0 | \n", "
Maritime Accident/Ground Transportation Advisory | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "
Tropical Cyclone / Storm, Severe Winds, Flooding, Evacuation, Air Travel Disruption, Port Closure, Power Outage, Public Safety / Security, Weather Advisory, Travel Warning | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Tropical Cyclone / Storm | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Public Utilities Disruption, Water Restriction Program | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Protest/Riot, Port Disruption, Cargo Disruption, Climate Change | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Protest / Riot, Public Safety / Security, Public Transportation Disruption, Police Operations, Roadway Closure / Disruption, Hazmat Response, Bombing | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Protest / Riot | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Cargo Disruption | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Political Crackdown / Opposition Movement | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Chemical Spill, Maritime Accident, Port Disruption, Hazmat Response, Public Safety / Security | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Maritime Accident/Port Disruption | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Maritime Accident, Maritime Advisory, Police Operations, Maritime Accident/Ground Transportation Advisory | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Maritime Accident / Hazmat Response | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Industrial Action, Maritime Advisory, Miscellaneous Strikes, Public Safety / Security | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Hazmat Response | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Ground Transportation Advisory / Brexit Contingency / Government Plan / Traffic Management / Border Control / Cross-Channel Traffic | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Ground Transportation Advisory | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Death / Injury, Individuals in Focus, Public Safety / Security, Public Transportation Disruption, Roadway Closure / Disruption | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "
Weather Advisory | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
\n", " | id | \n", "Headline | \n", "Summary | \n", "Severity | \n", "Category | \n", "Region | \n", "Datetime | \n", "Year | \n", "lat | \n", "lon | \n", "URL | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
GPT Generated Result | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
Maritime Advisory | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "13 | \n", "13 | \n", "0 | \n", "
Earthquake | \n", "18 | \n", "18 | \n", "18 | \n", "17 | \n", "18 | \n", "18 | \n", "18 | \n", "18 | \n", "14 | \n", "14 | \n", "0 | \n", "
Miscellaneous Events | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "6 | \n", "6 | \n", "0 | \n", "
Port Congestion | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "13 | \n", "11 | \n", "11 | \n", "0 | \n", "
Severe Winds | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "3 | \n", "3 | \n", "0 | \n", "
Port Disruption | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "4 | \n", "4 | \n", "0 | \n", "
Port Closure | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "2 | \n", "2 | \n", "0 | \n", "
Miscellaneous Strikes | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "0 | \n", "
Maritime Accident | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "0 | \n", "
Cargo Disruption | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Ground Transportation Advisory | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Hazmat Response | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
Weather Advisory | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
\n", " | Unnamed: 0 | \n", "id | \n", "Headline | \n", "Summary | \n", "Severity | \n", "Category_GoldenResult | \n", "Category_GPT | \n", "Region | \n", "Datetime | \n", "Year | \n", "lat | \n", "lon | \n", "URL | \n", "GPT Generated Result | \n", "Result_Golden | \n", "Result_GPT | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "86 | \n", "10 | \n", "14 miles NE of Jakarta - A magnitude 4.5 earth... | \n", "A magnitude 4.5 earthquake was detected 14 mil... | \n", "Moderate | \n", "Earthquake | \n", "Earthquake | \n", "Indonesia | \n", "24/9/18 18:33 | \n", "2018 | \n", "-6.10000 | \n", "107.02000 | \n", "NaN | \n", "Earthquake | \n", "True | \n", "True | \n", "
1 | \n", "87 | \n", "11 | \n", "17 miles SW of Batangas - A magnitude 5.5 eart... | \n", "Multiple sources report that a magnitude 5.5 e... | \n", "NaN | \n", "Earthquake | \n", "Earthquake | \n", "Philippines | \n", "31/8/18 15:04 | \n", "2018 | \n", "13.55600 | \n", "120.90300 | \n", "NaN | \n", "Earthquake | \n", "True | \n", "True | \n", "
2 | \n", "88 | \n", "16 | \n", "23 miles ESE of Taichung City- A magnitude 4.5... | \n", "A magnitude 4.5 earthquake was detected in cen... | \n", "Moderate | \n", "Earthquake | \n", "Earthquake | \n", "Taiwan | \n", "17/8/18 10:40 | \n", "2018 | \n", "24.02000 | \n", "121.03000 | \n", "NaN | \n", "Earthquake | \n", "True | \n", "True | \n", "
3 | \n", "89 | \n", "20 | \n", "33 miles SE of Valencia A magnitude 4.0 earthq... | \n", "The European-Mediterranean Seismological Centr... | \n", "Moderate | \n", "Earthquake | \n", "Earthquake | \n", "Spain | \n", "17/10/18 6:06 | \n", "2018 | \n", "39.23000 | \n", "0.16000 | \n", "NaN | \n", "Earthquake | \n", "True | \n", "True | \n", "
4 | \n", "90 | \n", "1981 | \n", "Philippines: Magnitude 6.2 earthquake recorded... | \n", "The United States Geological Survey (USGS) has... | \n", "Severe | \n", "Earthquake | \n", "Earthquake | \n", "Philippines | \n", "29/9/19 3:35 | \n", "2019 | \n", "6.35667 | \n", "126.18441 | \n", "NaN | \n", "Earthquake | \n", "True | \n", "True | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
94 | \n", "53 | \n", "2824 | \n", "UPDATE: High winds still causing port disrupti... | \n", "Industry sources on April 23 indicate that hig... | \n", "Moderate | \n", "Port Congestion | \n", "Weather Advisory | \n", "Saudi Arabia | \n", "18/4/19 13:31 | \n", "2019 | \n", "21.46250 | \n", "39.16000 | \n", "NaN | \n", "Weather Advisory | \n", "True | \n", "False | \n", "
95 | \n", "49 | \n", "2815 | \n", "UPDATE: Fog causing congestion in Houston, aff... | \n", "Updated sources report fog has delayed vessel ... | \n", "Severe | \n", "Port Congestion | \n", "NaN | \n", "United States | \n", "11/3/19 7:48 | \n", "2019 | \n", "29.68234 | \n", "-94.99355 | \n", "NaN | \n", "NaN | \n", "True | \n", "False | \n", "
96 | \n", "54 | \n", "2827 | \n", "UPDATE: Inbound pilotage suspended due to stro... | \n", "Sources indicate that strong winds have led to... | \n", "Moderate | \n", "Port Congestion | \n", "NaN | \n", "China | \n", "22/1/19 10:08 | \n", "2019 | \n", "31.32010 | \n", "121.65733 | \n", "NaN | \n", "NaN | \n", "True | \n", "False | \n", "
97 | \n", "60 | \n", "2869 | \n", "UPDATE: Port of Busan reopens after temporary ... | \n", "Updated sources indicate on October 4 that the... | \n", "Moderate | \n", "Port Congestion | \n", "NaN | \n", "Republic of Korea | \n", "30/9/19 11:41 | \n", "2019 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
98 | \n", "61 | \n", "2870 | \n", "UPDATE: Port of Charleston is open for busines... | \n", "Updated media sources indicate on September 6 ... | \n", "Severe | \n", "Port Congestion | \n", "NaN | \n", "United States | \n", "3/9/19 5:28 | \n", "2019 | \n", "32.90473 | \n", "-79.96455 | \n", "NaN | \n", "NaN | \n", "True | \n", "False | \n", "
99 rows × 16 columns
\n", "\n", " | Unnamed: 0 | \n", "id | \n", "Headline | \n", "Summary | \n", "Severity | \n", "Category_GPT | \n", "Region | \n", "Datetime | \n", "Year | \n", "lat | \n", "lon | \n", "URL | \n", "GPT Generated Result | \n", "Result_Golden | \n", "Result_GPT | \n", "Result_GPT_True_Count | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
Category_GoldenResult | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
Maritime Advisory | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "19 | \n", "20 | \n", "20 | \n", "20 | \n", "15 | \n", "15 | \n", "0 | \n", "19 | \n", "20 | \n", "20 | \n", "20 | \n", "
Miscellaneous Events | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "12 | \n", "12 | \n", "0 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "
Port Closure | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "16 | \n", "20 | \n", "20 | \n", "20 | \n", "15 | \n", "15 | \n", "0 | \n", "16 | \n", "20 | \n", "20 | \n", "20 | \n", "
Port Congestion | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "20 | \n", "16 | \n", "20 | \n", "20 | \n", "20 | \n", "11 | \n", "11 | \n", "0 | \n", "16 | \n", "20 | \n", "20 | \n", "20 | \n", "
Earthquake | \n", "19 | \n", "19 | \n", "19 | \n", "19 | \n", "18 | \n", "18 | \n", "19 | \n", "19 | \n", "19 | \n", "15 | \n", "15 | \n", "0 | \n", "18 | \n", "19 | \n", "19 | \n", "19 | \n", "