Niharmahesh committed on
Commit
fa541cf
·
verified ·
1 Parent(s): 31cc020

Update app.py

Browse files

Commented out the step that dropped duplicate rows and rows with NaT in date_posted, and commented out the filter that kept only rows posted in 2024.

Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -85,10 +85,10 @@ def load_and_concat_data():
85
  filtered_df = concatenated_df[columns_to_keep].reset_index(drop=True)
86
  filtered_df['date_posted'] = pd.to_datetime(filtered_df['date_posted'], errors='coerce')
87
 
88
- # Drop duplicates and rows with NaT in date_posted
89
- filtered_df = filtered_df.drop_duplicates().dropna(subset=['date_posted'])
90
  #filtering based on data in 2024
91
- filtered_df = filtered_df[filtered_df['date_posted'].dt.year==2024]
92
  # Convert titles and company name to lowercase
93
  filtered_df['title'] = filtered_df['title'].str.lower()
94
  filtered_df['company'] = filtered_df['company'].str.lower()
 
85
  filtered_df = concatenated_df[columns_to_keep].reset_index(drop=True)
86
  filtered_df['date_posted'] = pd.to_datetime(filtered_df['date_posted'], errors='coerce')
87
 
88
+ # Drop duplicates and rows with NaT in date_posted removed this to make it clear (jan13th)
89
+ #filtered_df = filtered_df.drop_duplicates().dropna(subset=['date_posted'])
90
  #filtering based on data in 2024
91
+ #filtered_df = filtered_df[filtered_df['date_posted'].dt.year==2024]
92
  # Convert titles and company name to lowercase
93
  filtered_df['title'] = filtered_df['title'].str.lower()
94
  filtered_df['company'] = filtered_df['company'].str.lower()