adding the bot and associated scripts
povilaskarvelis committed Jun 21, 2024
1 parent ca8445b commit b51c490
Showing 8 changed files with 1,087 additions and 0 deletions.
372 changes: 372 additions & 0 deletions _data/projects.json

Large diffs are not rendered by default.

38 changes: 38 additions & 0 deletions scripts/delete_duplicate_channels.py
@@ -0,0 +1,38 @@
import discord
import logging
from dotenv import load_dotenv
import os

# Initialize logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger('discord')

class ProjectsClient(discord.Client):
    def __init__(self, guild_id: int, *args, **kwargs):
        intents = discord.Intents.default()
        super().__init__(intents=intents, *args, **kwargs)
        self._guild_id = guild_id

    async def on_ready(self):
        logger.info(f'Logged in as {self.user} (ID: {self.user.id})')
        logger.info('------')
        guild = self.get_guild(self._guild_id)
        if guild:
            await self.delete_non_entrance_channels(guild)
        await self.close()

    async def delete_non_entrance_channels(self, guild: discord.Guild):
        for channel in guild.channels:
            if isinstance(channel, (discord.TextChannel, discord.VoiceChannel)):
                if channel.name.lower() != "entrance" and channel.category is None:
                    logger.info(f'Deleting channel: {channel.name} (ID: {channel.id})')
                    await channel.delete()
        logger.info('Finished deleting non-entrance channels.')

if __name__ == '__main__':
    load_dotenv()
    guild_id = int(os.getenv('DISCORD_GUILD_ID', ''))
    token = os.getenv('DISCORD_TOKEN', '')

    client = ProjectsClient(guild_id)
    client.run(token)
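
A minimal sketch of the environment this script expects, based on the os.getenv calls above; the values are placeholders, not real credentials:

# With python-dotenv, these can live in a .env file at the repository root:
#
#   DISCORD_TOKEN=<bot token>
#   DISCORD_GUILD_ID=<numeric guild ID>
#
# Equivalent setup directly in Python, e.g. for a quick local test:
import os

os.environ['DISCORD_TOKEN'] = '<bot token>'             # placeholder
os.environ['DISCORD_GUILD_ID'] = '123456789012345678'   # placeholder ID
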
18 changes: 18 additions & 0 deletions scripts/ensure_discord.py
@@ -0,0 +1,18 @@
import os
from projects_bot import ProjectsClient

if __name__ == '__main__':
    from dotenv import load_dotenv
    load_dotenv()

    token = os.getenv('DISCORD_TOKEN', '')
    guild = int(os.getenv('DISCORD_GUILD_ID', ''))
    roles_channel = int(os.getenv('DISCORD_ROLES_CHANNEL', ''))

    client = ProjectsClient(
        guild, roles_channel,
        # just_ensure_channels=True,
        # just_ensure_events=True
        sleep_mode=False
    )
    client.run(token)
139 changes: 139 additions & 0 deletions scripts/fetch_gh_issues.py
@@ -0,0 +1,139 @@
#!/bin/env python

# Import necessary modules
import os
import re
import requests
import yaml
import json

# Define the main function to fetch GitHub issues
def fetch_gh_issues():

    # Get GitHub authentication token from environment variable
    GH_AUTH = os.environ['GH_AUTH']

    # Define the repository and issue labels
    REPO = 'ohbm/hackathon2024'
    ISSUE_LABEL = ':rocket: HackTrack Project'
    ISSUE_READY_LABEL = ':mag: Review: Good to go ✅'

    # Define issue filters for the API request
    ISSUE_FILTER = f'labels={ISSUE_LABEL}&per_page=100'
    # NOTE: the assignment below overrides the label filter above, so all issues
    # are fetched and the label check is done per issue further down
    ISSUE_FILTER = f'per_page=100'

    # Construct the API URL with the authentication token and filters
    URL = f'https://{GH_AUTH}@api.github.com/repos/{REPO}/issues?{ISSUE_FILTER}'

    # Load the issue form template from a YAML file
    with open('.github/ISSUE_TEMPLATE/brainhack-hacktrack-project.yml') as f:
        issue_form = yaml.safe_load(f)

    # Get the fields from the issue form template, excluding markdown fields
    fields = issue_form['body']
    fields = [f for f in fields if f['type'] != 'markdown']

    # Make a request to the GitHub API to fetch issues
    res = requests.get(URL)
    issues = res.json()

    # Initialize a list to store the filtered issue information
    issues_list = []

    # Loop through each issue
    for issue in issues:

        # Skip issues that do not have the "Good to go" label or are not open
        if ISSUE_READY_LABEL not in [i['name'] for i in issue["labels"]]:
            continue
        if issue["state"] != "open":
            continue

        try:
            # Extract and process the issue body text
            body = issue["body"]
            lines = [l.strip() for l in body.replace('\r\n', '\n').split('\n')]

            field_ordering = []

            # Determine the order of fields in the issue body
            for field in fields:
                field_start = None
                field_label = field['attributes']['label']

                for li, line in enumerate(lines):
                    is_line_title = line.startswith(f'### {field_label}')
                    if field_start is None and is_line_title:
                        field_start = li

                field_ordering += [(field, field_start)]
            field_ordering = list(sorted(field_ordering, key=lambda f: f[1]))

            issue_info = {}

            # Extract the values for each field in the issue
            field_bounds = zip(field_ordering, field_ordering[1:] + [(None, None)])
            for (field, i), (_, ni) in field_bounds:
                field_id = field['id']
                field_label = field['attributes']['label']

                if i is None:
                    issue_info[field_id] = None
                    continue

                field_value = '\n'.join(filter(None, lines[i+1:ni]))

                # Remove HTML comments from the field value
                field_value = re.sub(
                    r'<!--.*?-->', '', field_value,
                    flags=re.DOTALL
                )
                field_value = field_value.strip()

                # Handle default "No response" values
                if field_value == '_No response_':
                    field_value = None

                # Process checkbox fields
                if field['type'] == 'checkboxes':
                    field_options_labels = [
                        o['label'].strip()
                        for o in field['attributes']['options']
                    ]
                    field_selected_options = []
                    field_options_value = field_value.split('\n')
                    for l in field_options_value:
                        if l[6:] not in field_options_labels:
                            continue
                        if l.startswith('- [X] '):
                            field_selected_options.append(l[6:])
                        if l.startswith('- [x] '):
                            field_selected_options.append(l[6:])

                    field_value = field_selected_options

                issue_info[field_id] = field_value

            # Remove the primary hub from the list of other hubs
            if issue_info['hub'] in issue_info['otherhub']:
                issue_info['otherhub'].remove(issue_info['hub'])

            # Add issue link and number to the issue info
            issue_info['issue_link'] = issue["html_url"]
            issue_info['issue_number'] = issue["number"]
            issues_list.append(issue_info)

        # Skip issues that raise exceptions
        except:
            pass

    # Write the filtered issue information to a JSON file
    with open('./_data/projects.json', 'w') as f:
        json.dump(issues_list, f, indent=2)

# Run the fetch_gh_issues function if the script is executed directly
if __name__ == '__main__':
    from dotenv import load_dotenv
    load_dotenv()

    fetch_gh_issues()
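
For reference, a minimal sketch of one entry this script might write to _data/projects.json. Only 'hub', 'otherhub', 'issue_link', and 'issue_number' appear in the code above; the remaining field ids and values are hypothetical and would come from the brainhack-hacktrack-project.yml issue form:

example_entry = {
    "title": "Example project",   # hypothetical field id from the issue form
    "hub": "Hub A",               # hypothetical dropdown value, parsed from its '### ...' section
    "otherhub": ["Hub B"],        # checkbox field, with the primary hub removed
    "issue_link": "https://github.com/ohbm/hackathon2024/issues/1",  # placeholder issue number
    "issue_number": 1,            # placeholder
}
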
138 changes: 138 additions & 0 deletions scripts/fetch_gh_proceedings.py
@@ -0,0 +1,138 @@
#!/bin/env python

# Import necessary modules
import os
import re
import requests
import yaml
import json

# Define the main function to fetch GitHub issues
def fetch_gh_issues():

    # Get GitHub authentication token from environment variable
    GH_AUTH = os.environ['GH_AUTH']

    # Define the repository and issue label
    REPO = 'ohbm/hackathon2024'
    ISSUE_LABEL = 'Proceedings'
    # ISSUE_READY_LABEL = 'Good to go'  # Commented out, not used in this script

    # Define issue filter for the API request
    ISSUE_FILTER = f'labels={ISSUE_LABEL}&per_page=100'

    # Construct the API URL with the authentication token and filters
    URL = f'https://{GH_AUTH}@api.github.com/repos/{REPO}/issues?{ISSUE_FILTER}'

    # Load the issue form template from a YAML file
    with open('.github/ISSUE_TEMPLATE/hackathon-proceedings.yml') as f:
        issue_form = yaml.safe_load(f)

    # Get the fields from the issue form template, excluding markdown fields
    fields = issue_form['body']
    fields = [f for f in fields if f['type'] != 'markdown']

    # Make a request to the GitHub API to fetch issues
    res = requests.get(URL)
    issues = res.json()

    # Initialize a list to store the filtered issue information
    issues_list = []

    # Loop through each issue
    for issue in issues:

        print("looking for issue", issue['url'])

        # Skip issues that are not in the 'open' state
        if issue["state"] != "open":
            continue

        print('passed')

        try:
            # Extract and process the issue body text
            body = issue["body"]
            lines = [l.strip() for l in body.replace('\r\n', '\n').split('\n')]

            field_ordering = []

            # Determine the order of fields in the issue body
            for field in fields:
                field_start = None
                field_label = field['attributes']['label']

                for li, line in enumerate(lines):
                    is_line_title = line.startswith(f'### {field_label}')
                    if field_start is None and is_line_title:
                        field_start = li

                field_ordering += [(field, field_start)]
            field_ordering = list(sorted(field_ordering, key=lambda f: f[1]))

            issue_info = {}

            # Extract the values for each field in the issue
            field_bounds = zip(field_ordering, field_ordering[1:] + [(None, None)])
            for (field, i), (_, ni) in field_bounds:
                field_id = field['id']
                field_label = field['attributes']['label']

                if i is None:
                    issue_info[field_id] = None
                    continue

                field_value = '\n'.join(filter(None, lines[i+1:ni]))

                # Remove HTML comments from the field value
                field_value = re.sub(
                    r'<!--.*?-->', '', field_value,
                    flags=re.DOTALL
                )
                field_value = field_value.strip()

                # Handle default "No response" values
                if field_value == '_No response_':
                    field_value = None

                # Process checkbox fields
                if field['type'] == 'checkboxes':
                    field_options_labels = [
                        o['label'].strip()
                        for o in field['attributes']['options']
                    ]
                    field_selected_options = []
                    field_options_value = field_value.split('\n')
                    for l in field_options_value:
                        if l[6:] not in field_options_labels:
                            continue
                        if l.startswith('- [X] '):
                            field_selected_options.append(l[6:])
                        if l.startswith('- [x] '):
                            field_selected_options.append(l[6:])

                    field_value = field_selected_options

                issue_info[field_id] = field_value

            # Add issue link and number to the issue info
            issue_info['issue_link'] = issue["html_url"]
            issue_info['issue_number'] = issue["number"]
            issues_list.append(issue_info)

        # Handle and log any exceptions that occur during processing
        except Exception as e:
            print("error in issue", issue['url'])
            print(e)
            raise e

    # Write the filtered issue information to a JSON file
    with open('./public/proceedings.json', 'w') as f:
        json.dump(issues_list, f, indent=2)

# Run the fetch_gh_issues function if the script is executed directly
if __name__ == '__main__':
    from dotenv import load_dotenv
    load_dotenv()

    fetch_gh_issues()
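
A standalone sketch of the checkbox parsing shared by both fetch scripts: GitHub renders a checkboxes field as markdown task-list lines, and the six-character prefix '- [x] ' (or '- [X] ', or '- [ ] ' when unchecked) is stripped with l[6:] before comparing the remainder against the option labels from the form. The labels and lines below are made up for illustration:

field_options_labels = ["Option A", "Option B", "Option C"]   # would come from the issue form YAML
field_value = "- [x] Option A\n- [ ] Option B\n- [X] Option C"

field_selected_options = []
for l in field_value.split('\n'):
    if l[6:] not in field_options_labels:   # skip lines that are not known options
        continue
    if l.startswith('- [X] ') or l.startswith('- [x] '):
        field_selected_options.append(l[6:])

print(field_selected_options)   # ['Option A', 'Option C']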