-import os
-import re
-from datetime import datetime, time
-from pathlib import Path
+import datetime
+import pathlib
 from urllib.parse import urlparse
+from typing import Iterator
 
-import yaml
-from github import Auth, Github
-from github.Issue import Issue
-from github.PaginatedList import PaginatedList
+import json
+import gh_issues
 
-ROOT = Path(__file__).parent.parent
-conferences_path = ROOT / "_data/conferences.yml"
 
+QUERY = "repo:blackpythondevs/blackpythondevs.github.io type:issue label:conference"
 
-def create_github_client():
-    gh_token = os.getenv("GITHUB_TOKEN", "")
-    auth = Auth.Token(gh_token)
-    client = Github(auth=auth)
-    return client
 
-
-def get_open_issues(gh: Github) -> PaginatedList[Issue]:
-    repo = gh.get_repo("BlackPythonDevs/blackpythondevs.github.io")
-    issues = repo.get_issues(state="open", labels=["conference"])
+def get_conference_issues(
+    query: str = QUERY,
+) -> Iterator[gh_issues.Issue]:  # pragma no cover
+    issues = gh_issues.issues_by_query(query)
     return issues
 
 
-def parse_conference_details(issue_body: str) -> dict | None:
-    # Extract fields from issue body
-    name_match = re.search(
-        r"Conference Name(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}", issue_body
-    )
-    url_match = re.search(r"URL(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}", issue_body)
-    dates_match = re.search(
-        r"Conference Dates(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}", issue_body
-    )
-    type_match = re.search(
-        r"Conference Type(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}", issue_body
-    )
-    location_match = re.search(
-        r"Conference Location(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}", issue_body
-    )
-    summary_match = re.search(
-        r"Summary(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}",
-        issue_body,
-        re.DOTALL,
-    )
-    speaking_match = re.search(
-        r"Speaking(?:\r\n|\n){2}(.*?)(?:\r\n|\n){2}### Code of Conduct(?:\r\n|\n){2}",
-        issue_body,
-        re.DOTALL,
-    )
+def normalize_url(url_match: str | None) -> str | None:
+    """
+    Parse the url and see if a scheme (`https`) is included in it.
+    If not, then prepend `https` to the url from the issue body
 
-    # Set a default value of None for when the url field isn't as expected
-    valid_url = normalize_url() if not url_match else normalize_url(url_match[1])
-
-    if dates_match:
-        conferenceDates = dates_match[1]
-        # Parse the end date of the conference
-        endDateStr = conferenceDates.split("-")[1].strip()
-        endDate = datetime.strptime(endDateStr, "%d %b %Y")
-        # Check if the conference end date is greater than today
-        today = datetime.combine(datetime.now(), time())
-
-        if endDate >= today:
-            conference = {
-                "name": name_match[1],
-                "url": valid_url,
-                "dates": dates_match[1],
-                "type": type_match[1],
-                "location": location_match[1],
-                "summary": summary_match[1],
-                "speaking": speaking_match[1] if speaking_match else "",
-            }
-            return conference
-    return None
-
-
-def normalize_url(url_match: str = None):
-    valid_url = None
-    # Ensure the url field is not blank and the url matches the regex
-    if url_match is not None and url_match.strip() != "":
-        # Parse the url and see if a scheme (`https`) is included in it
-        # If not, then prepend `https` to the url from the issue body
-        # This guards against the website thinking the passed in url is another page on https://blackpythondevs.com/
+    This guards against the website thinking the passed in url is another page on https://blackpythondevs.com/
+    """
+    if url_match:
         parsed_url = urlparse(url_match)
+
         if "http" not in parsed_url.scheme.casefold():
-            valid_url = f"https://{url_match}"
+            return f"https://{url_match}"
         else:
-            valid_url = url_match
-    return valid_url
+            return url_match
 
 
 def write_conferences_to_file(confs: list[dict]):
     # Write the conferences to the _data/conferences.yml file
-    with conferences_path.open("w") as f:
-        yaml.dump(confs, f)
-
-
-if __name__ == "__main__":
-    conferences = []
-
-    # Create Github client object
-    gh_client = create_github_client()
-
-    # Get open issues from repo
-    open_issues: PaginatedList[Issue] = get_open_issues(gh_client)
-
-    # Parse each conference issue so long as it has the "conference" label
-    for issue in open_issues:
-        if "conference" in [label.name for label in issue.labels]:
-            parsed_conf = parse_conference_details(issue_body=issue.body)
-            if parsed_conf:
-                conferences.append(parsed_conf)
-
-    write_conferences_to_file(conferences)
+    conferences_path.write_text(json.dumps(confs))
+
+
+def __to_conference_date(conference_date: str) -> datetime.date:
+    return datetime.date.fromisoformat(conference_date)
+
+
+def parse_conference(issue: gh_issues.Issue) -> dict[str, str | None]:
+    """convert an issue to a dictionary of parsed data"""
+
+    KEYS = [
+        "conference_name",
+        "url",
+        "conference_start_date",
+        "conference_end_date",
+        "conference_type",
+        "conference_location",
+        "summary",
+        "speaking",
+    ]
+
+    _issue = {k: getattr(issue, k, None) for k in KEYS}
+    _issue["url"] = normalize_url(_issue.get("url", None))
+    return _issue
+
+
+def _validate_issue(issue: gh_issues.Issue, date_to_check: str) -> bool:
+    """Validate an issue based on its `date_to_check`"""
+    if not (valid_date := getattr(issue, date_to_check, False)):
+        return False
+    else:
+        return __to_conference_date(valid_date) >= datetime.date.today()
+
+
+def build_conferences() -> list[dict[str, str | None]]:  # pragma: no cover
+    return [
+        parse_conference(issue)
+        for issue in get_conference_issues()
+        if _validate_issue(issue, "conference_end_date")
+    ]
+
+
+if __name__ == "__main__":  # pragma: no cover
+    ROOT = pathlib.Path(__file__).parent.parent
+    conferences_path = ROOT.joinpath("_data/conferences.json")
+    conferences = build_conferences()
+    conferences_path.write_text(
+        json.dumps(
+            list(
+                sorted(
+                    conferences,
+                    key=lambda x: __to_conference_date(x["conference_start_date"]),
+                )
+            ),
+            indent=2,
+        )
+    )
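
For context, here is a minimal, self-contained sketch of the two pieces of pure-Python logic the refactored script leans on: URL normalization and end-date filtering. It mirrors normalize_url() and _validate_issue() from the diff above; FakeIssue-style SimpleNamespace and the helper name is_upcoming are only hypothetical stand-ins, since real issues come from gh_issues.issues_by_query() and are assumed to expose the parsed issue-form fields (conference_name, url, conference_end_date, ...) as attributes.

import datetime
from types import SimpleNamespace
from urllib.parse import urlparse


def normalize_url(url_match: str | None) -> str | None:
    # Prepend https:// when the issue body left out the scheme, so the site
    # does not treat the value as a relative page on blackpythondevs.com.
    if url_match:
        parsed_url = urlparse(url_match)
        if "http" not in parsed_url.scheme.casefold():
            return f"https://{url_match}"
        return url_match
    return None


def is_upcoming(issue, date_attr: str = "conference_end_date") -> bool:
    # Keep only conferences whose end date (an ISO "YYYY-MM-DD" string)
    # is today or later; a missing date fails validation.
    value = getattr(issue, date_attr, None)
    if not value:
        return False
    return datetime.date.fromisoformat(value) >= datetime.date.today()


# Hypothetical stand-in for a parsed gh_issues.Issue.
fake_issue = SimpleNamespace(
    conference_name="Example Conf",
    url="example.com/conf",
    conference_start_date="2099-06-01",
    conference_end_date="2099-06-03",
)

print(normalize_url(fake_issue.url))  # https://example.com/conf
print(is_upcoming(fake_issue))        # True (until 2099-06-03 has passed)

For issues that pass this check, build_conferences() returns a list of dicts keyed by the names in KEYS, which the __main__ block sorts by conference_start_date and writes as indented JSON to _data/conferences.json.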