Spaces:
Running
Running
Update app.py
Browse files
Removed the NaN filter; the filtering based on year has been commented out.
app.py
CHANGED
@@ -85,10 +85,10 @@ def load_and_concat_data():
|
|
85 |
filtered_df = concatenated_df[columns_to_keep].reset_index(drop=True)
|
86 |
filtered_df['date_posted'] = pd.to_datetime(filtered_df['date_posted'], errors='coerce')
|
87 |
|
88 |
-
# Drop duplicates and rows with NaT in date_posted
|
89 |
-
filtered_df = filtered_df.drop_duplicates().dropna(subset=['date_posted'])
|
90 |
#filtering based on data in 2024
|
91 |
-
filtered_df = filtered_df[filtered_df['date_posted'].dt.year==2024]
|
92 |
# Convert titles and company name to lowercase
|
93 |
filtered_df['title'] = filtered_df['title'].str.lower()
|
94 |
filtered_df['company'] = filtered_df['company'].str.lower()
|
|
|
85 |
filtered_df = concatenated_df[columns_to_keep].reset_index(drop=True)
|
86 |
filtered_df['date_posted'] = pd.to_datetime(filtered_df['date_posted'], errors='coerce')
|
87 |
|
88 |
+
# Drop duplicates and rows with NaT in date_posted removed this to make it clear (jan13th)
|
89 |
+
#filtered_df = filtered_df.drop_duplicates().dropna(subset=['date_posted'])
|
90 |
#filtering based on data in 2024
|
91 |
+
#filtered_df = filtered_df[filtered_df['date_posted'].dt.year==2024]
|
92 |
# Convert titles and company name to lowercase
|
93 |
filtered_df['title'] = filtered_df['title'].str.lower()
|
94 |
filtered_df['company'] = filtered_df['company'].str.lower()
|