Spaces:

AlvaroMros
/

ufc-predictor

Sleeping

App Files Files Community

Alvaro commited on Jul 3

Commit

b38f690

1 Parent(s): a49cbb2

Update

Browse files

Files changed (6) hide show

.gitignore +0 -1
output/ufc_events_detailed.json +3 -0
output/ufc_fights.csv +0 -0
src/analyze.py +15 -0
main.py → src/scrape_fights.py +0 -0
src/to_csv.py +87 -0

.gitignore DELETED Viewed

	@@ -1 +0,0 @@
1	- ufc_events_detailed.json

output/ufc_events_detailed.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:efffe902c81d1ab870852e9dd6d192e3b203e11b1a99a36c7ea97be451d197d6
+size 15088727

output/ufc_fights.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

src/analyze.py ADDED Viewed

	@@ -0,0 +1,15 @@

+import json
+ufc_events = json.load(open('ufc_events_detailed.json'))
+unique_fighters = set()
+for event in ufc_events:
+    for fight in event['fights']:
+        unique_fighters.add(fight['fighter_1'])
+        unique_fighters.add(fight['fighter_2'])
+print(len(unique_fighters))

main.py → src/scrape_fights.py RENAMED Viewed

File without changes

src/to_csv.py ADDED Viewed

	@@ -0,0 +1,87 @@

+import json
+import csv
+def json_to_csv(json_file_path, csv_file_path):
+    try:
+        with open(json_file_path, 'r', encoding='utf-8') as json_file:
+            data = json.load(json_file)
+    except FileNotFoundError:
+        print(f"Error: The file {json_file_path} was not found.")
+        return
+    except json.JSONDecodeError:
+        print(f"Error: Could not decode JSON from {json_file_path}.")
+        return
+    # Define the headers for the CSV file
+    headers = [
+        'event_name', 'event_date', 'event_location', 'fighter_1', 'fighter_2',
+        'weight_class', 'method', 'round', 'time',
+        'f1_kd', 'f1_sig_str', 'f1_sig_str_percent', 'f1_total_str', 'f1_td',
+        'f1_td_percent', 'f1_sub_att', 'f1_rev', 'f1_ctrl',
+        'f1_sig_str_head', 'f1_sig_str_body', 'f1_sig_str_leg', 'f1_sig_str_distance',
+        'f1_sig_str_clinch', 'f1_sig_str_ground',
+        'f2_kd', 'f2_sig_str', 'f2_sig_str_percent', 'f2_total_str', 'f2_td',
+        'f2_td_percent', 'f2_sub_att', 'f2_rev', 'f2_ctrl',
+        'f2_sig_str_head', 'f2_sig_str_body', 'f2_sig_str_leg', 'f2_sig_str_distance',
+        'f2_sig_str_clinch', 'f2_sig_str_ground'
+    ]
+    with open(csv_file_path, 'w', newline='', encoding='utf-8') as csv_file:
+        writer = csv.writer(csv_file)
+        writer.writerow(headers)
+        for event in data:
+            for fight in event.get('fights', []):
+                details = fight.get('details')
+                # Create a dictionary for easier and safer access to stats
+                f1_stats = details.get('fighter_1_stats', {}) if details else {}
+                f2_stats = details.get('fighter_2_stats', {}) if details else {}
+                row = [
+                    event.get('name', ''),
+                    event.get('date', ''),
+                    event.get('location', ''),
+                    fight.get('fighter_1', ''),
+                    fight.get('fighter_2', ''),
+                    fight.get('weight_class', ''),
+                    fight.get('method', ''),
+                    fight.get('round', ''),
+                    fight.get('time', ''),
+                    f1_stats.get('kd', ''),
+                    f1_stats.get('sig_str', ''),
+                    f1_stats.get('sig_str_percent', ''),
+                    f1_stats.get('total_str', ''),
+                    f1_stats.get('td', ''),
+                    f1_stats.get('td_percent', ''),
+                    f1_stats.get('sub_att', ''),
+                    f1_stats.get('rev', ''),
+                    f1_stats.get('ctrl', ''),
+                    f1_stats.get('sig_str_head', ''),
+                    f1_stats.get('sig_str_body', ''),
+                    f1_stats.get('sig_str_leg', ''),
+                    f1_stats.get('sig_str_distance', ''),
+                    f1_stats.get('sig_str_clinch', ''),
+                    f1_stats.get('sig_str_ground', ''),
+                    f2_stats.get('kd', ''),
+                    f2_stats.get('sig_str', ''),
+                    f2_stats.get('sig_str_percent', ''),
+                    f2_stats.get('total_str', ''),
+                    f2_stats.get('td', ''),
+                    f2_stats.get('td_percent', ''),
+                    f2_stats.get('sub_att', ''),
+                    f2_stats.get('rev', ''),
+                    f2_stats.get('ctrl', ''),
+                    f2_stats.get('sig_str_head', ''),
+                    f2_stats.get('sig_str_body', ''),
+                    f2_stats.get('sig_str_leg', ''),
+                    f2_stats.get('sig_str_distance', ''),
+                    f2_stats.get('sig_str_clinch', ''),
+                    f2_stats.get('sig_str_ground', '')
+                ]
+                writer.writerow(row)
+    print(f"Successfully converted {json_file_path} to {csv_file_path}")
+if __name__ == '__main__':
+    json_to_csv('ufc_events_detailed.json', 'ufc_fights.csv')