Spaces:
Sleeping
Sleeping
"""Filter the Twitter, Reddit, AAPL and TSLA datasets down to one calendar day.

Reads the four cleaned CSV files, parses each dataset's date column, keeps
only the rows that fall on the target date, prints the resulting shapes and
writes each filtered dataset to its own CSV file.
"""
import pandas as pd


def _find_date_column(frame):
    """Return the name of the date column in *frame*.

    Accepts either 'Date' or 'date', since the casing may differ between the
    social-media and stock datasets.

    Raises:
        KeyError: if neither column is present.
    """
    for candidate in ('Date', 'date'):
        if candidate in frame.columns:
            return candidate
    raise KeyError(
        f"No 'Date' or 'date' column found; columns are {list(frame.columns)}"
    )


def _filter_to_date(frame, day):
    """Parse the date column of *frame* in place and return the rows on *day*.

    The date column is overwritten with its parsed datetime values
    (unparseable entries become NaT). Rows are matched on the calendar day,
    so a time-of-day component does not exclude a row.
    """
    column = _find_date_column(frame)
    frame[column] = pd.to_datetime(frame[column], errors='coerce')
    stamps = frame[column]

    if not pd.api.types.is_datetime64_any_dtype(stamps):
        # Parsing did not yield a datetime column (no .dt accessor available);
        # fall back to a plain equality comparison.
        return frame[stamps == day]

    if stamps.dt.tz is not None:
        # Drop the timezone for the comparison only, so the naive target date
        # is compared against each row's local wall-clock day.
        stamps = stamps.dt.tz_localize(None)

    # Compare on midnight-normalized values: NaT rows never match.
    return frame[stamps.dt.normalize() == day.normalize()]


# Load your datasets
twitter_data = pd.read_csv('cleaned_twitter_data.csv')  # Twitter data
reddit_data = pd.read_csv('cleaned_reddit_data.csv')  # Reddit data
aapl_stock_data = pd.read_csv('cleaned_AAPL_stock_data.csv')  # AAPL stock data
tsla_stock_data = pd.read_csv('cleaned_TSLA_stock_data.csv')  # TSLA stock data

# Print the column names to check if they match the expected columns
print("Twitter Data Columns:", twitter_data.columns)
print("Reddit Data Columns:", reddit_data.columns)
print("AAPL Stock Data Columns:", aapl_stock_data.columns)
print("TSLA Stock Data Columns:", tsla_stock_data.columns)

# Define the target date to filter data to (2024-12-30)
target_date = pd.to_datetime('2024-12-30')

# Convert each dataset's date column ('Date' or 'date') to datetime and keep
# only the rows that fall on the target date
twitter_data_filtered = _filter_to_date(twitter_data, target_date)
reddit_data_filtered = _filter_to_date(reddit_data, target_date)
aapl_stock_data_filtered = _filter_to_date(aapl_stock_data, target_date)
tsla_stock_data_filtered = _filter_to_date(tsla_stock_data, target_date)

# Check the resulting filtered datasets
print(f"Filtered Twitter Data: {twitter_data_filtered.shape}")
print(f"Filtered Reddit Data: {reddit_data_filtered.shape}")
print(f"Filtered AAPL Stock Data: {aapl_stock_data_filtered.shape}")
print(f"Filtered TSLA Stock Data: {tsla_stock_data_filtered.shape}")

# Save the filtered datasets to new CSV files
twitter_data_filtered.to_csv('filtered_twitter_data.csv', index=False)
reddit_data_filtered.to_csv('filtered_reddit_data.csv', index=False)
aapl_stock_data_filtered.to_csv('filtered_aapl_stock_data.csv', index=False)
tsla_stock_data_filtered.to_csv('filtered_tsla_stock_data.csv', index=False)