import os import json import pandas as pd import matplotlib.pyplot as plt import seaborn as sns data_dir = './' all_data = [] all_tap_logs = [] for filename in os.listdir(data_dir): if filename.endswith('.json'): file_path = os.path.join(data_dir, filename) with open(file_path, encoding='utf-8') as file: data = json.load(file) tap_logs = data.get('sensorLog', {}).get('tapLog', []) for entry in tap_logs: entry['participant_id'] = filename all_tap_logs.append(entry) df = pd.DataFrame(all_tap_logs) df['timestamp'] = pd.to_datetime(df['timestamp']) df['path'] = df['url'].apply(lambda x: x.split('://')[-1].split('/', 1)[-1]) # Mapping with tour_operators being mergeable to study page 2. :) path_to_label = { "study-page-1": "Study Page 1", "study-page-2": "Study Page 2", "study-page-3": "Study Page 3", "study-page-4": "Study Page 4", "study-page-5": "Study Page 5", "study-page-6": "Study Page 6", #"tour_operators": "Study Page 2" } df['label'] = df['path'].map(path_to_label) grouped = df.groupby('label') # JSON list structure def generate_heatmap_data(group): heatmap_data = group[['x', 'y']].copy() heatmap_data['radius'] = 40 heatmap_data['value'] = 5 heatmap_data['x'] = heatmap_data['x'].astype(str) heatmap_data['y'] = heatmap_data['y'].astype(str) heatmap_data_list = heatmap_data.to_dict(orient='records') min_value = 1 max_value = 9999 return { "min": min_value, "max": max_value, "data": heatmap_data_list } for label, group in grouped: heatmap_data = generate_heatmap_data(group.apply(lambda x: round(x))) json_filename = f"{label.replace(' ', '_').lower()}.json" with open(json_filename, 'w', encoding='utf-8') as json_file: json.dump(heatmap_data, json_file, indent=4) print(f"Generated {json_filename} with {len(heatmap_data)} records.")