diff --git a/analysis_notebook_hashtag.ipynb b/analysis_notebook_hashtag.ipynb index 4777b28..39814b4 100644 --- a/analysis_notebook_hashtag.ipynb +++ b/analysis_notebook_hashtag.ipynb @@ -89,7 +89,7 @@ "source": [ "# Changes 'created_at' to data format datetime64[ns, tzlocal()]\n", "# That is necessary for date specific filtering\n", - "df['created_at'] = pd.to_datetime(df['created_at'], utc=True)\n", + "df['created_at'] = pd.to_datetime(df['created_at'], errors='coerce', utc=True)\n", "\n", "# Adding the column 'instance' by extracting the domain name (and suffix) from the column 'url' of the post\n", "df['instance'] = df['url'].apply(lambda x: urlparse(x)[1])"