digital-land
diff --git a/‎.github/workflows/daily-issue-tracking.yml‎
Lines changed: 49 additions & 0 deletions b/‎.github/workflows/daily-issue-tracking.yml‎
Lines changed: 49 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 0 deletions b/‎.gitignore‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎Makefile‎
Lines changed: 11 additions & 0 deletions b/‎Makefile‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎bin/admin_data/label_module_map.csv‎
Lines changed: 46 additions & 0 deletions b/‎bin/admin_data/label_module_map.csv‎
Lines changed: 46 additions & 0 deletions
diff --git a/‎bin/csv_helpers.py‎
Lines changed: 25 additions & 0 deletions b/‎bin/csv_helpers.py‎
Lines changed: 25 additions & 0 deletions
diff --git a/‎bin/github_api.py‎
Lines changed: 185 additions & 0 deletions b/‎bin/github_api.py‎
Lines changed: 185 additions & 0 deletions
@@ -0,0 +1,49 @@
+name: Daily Issue Tracking Update
+
+on:
+  schedule:
+    # Run daily at 9:00 AM UTC (adjust as needed)
+    - cron: '0 9 * * *'
+  workflow_dispatch:  # Allow manual triggering
+
+# The last step commits and pushes with the default GITHUB_TOKEN, which needs
+# write access to repository contents (the token is read-only in repositories
+# that use restricted default permissions).
+permissions:
+  contents: write
+
+jobs:
+  update-issue-tracking:
+    runs-on: ubuntu-latest
+    # Make the token available in every step's process environment, for any
+    # code that reads GITHUB_TOKEN from the environment rather than from .env.
+    env:
+      GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+
+    steps:
+    - name: Checkout repository
+      uses: actions/checkout@v4
+      with:
+        token: ${{ secrets.GITHUB_TOKEN }}
+
+    - name: Set up Python
+      uses: actions/setup-python@v5
+      with:
+        python-version: '3.10'
+
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        make init
+
+    # NOTE: the commit step runs `git add .`, so .env must stay git-ignored
+    # or this file would be staged along with the generated output.
+    - name: Set up environment variables
+      run: |
+        echo "GITHUB_TOKEN=$GITHUB_TOKEN" > .env
+
+    - name: Generate issue report
+      working-directory: bin
+      run: |
+        python -c "from issue_tracking import gen_issue_report; gen_issue_report()"
+
+    - name: Generate markdown output
+      working-directory: bin
+      run: |
+        python -c "from issue_tracking_output import generate_issue_tracking_index; generate_issue_tracking_index()"
+
+    - name: Commit and push changes
+      run: |
+        git config --local user.email "action@github.com"
+        git config --local user.name "GitHub Action"
+        make commit-issue-tracking
@@ -295,3 +295,5 @@ dist
 .python-version
 .vscode
 package-lock.json
+
+# Local cache of fetched GitHub issues (bin/github_api.py writes
+# cache/github_issues_cache.json, relative to the working directory)
+cache/
@@ -1,3 +1,6 @@
+# Name of the current git branch, resolved once when the Makefile is parsed;
+# used as the push target by commit-issue-tracking.
+BRANCH := $(shell git rev-parse --abbrev-ref HEAD)
+
 init::
 	python -m pip install --upgrade pip
 	python -m pip install pip-tools
@@ -8,3 +11,11 @@ init::
 
 checks:
 	python3 bin/check.py
+
+
+# Neither target produces a file of the same name, so always run them.
+.PHONY: status commit-issue-tracking
+
+# Show the working-tree state, including ignored files.
+status:
+	git status --ignored
+
+# Stage everything and, only when there is something to commit, commit it
+# and push to the current branch. The push runs only if the commit succeeded.
+commit-issue-tracking::
+	git add .
+	git diff --quiet && git diff --staged --quiet || (git commit -m "Latest issue tracking updates $(shell date +%F)" && git push origin $(BRANCH))
@@ -0,0 +1,46 @@
+github_label,module
+"component: Type of proposed advertisement",advertisement-types
+"component: advertisement period",advert-period
+"component: agent contact details",agent-contact
+"component: applicant contact details",applicant-contact
+"component: application for tree works - checklist",checklist
+"component: application reqs - checklist",checklist
+"component: checklist",checklist
+"component: declaration",declaration
+"component: demolition",demolition
+"component: designated area",designated-areas
+"component: details proposed adverts",proposed-advert-details
+"component: employment",employment
+"component: foul sewage",foul-sewage
+"component: pedestrian and vehicle access",access-rights-of-way
+"component: planning application req - checklist",checklist
+"component: processes and machinery",processes-machinery-waste
+"component: res units",res-units
+"component: site area",site-area
+"component: trade effluent",trade-effluent
+"component: trees location",trees-location
+"component: type of dev",dev-type
+"component: vehicle parking",vehicle-parking
+"component: waste and storage",waste-storage-collection
+"component:agent name and address",agent-details
+"component:applicant name and address",applicant-details
+"component:assessment of flood risk",flood-risk-assessment
+"component:authority employee / member",conflict-of-interest
+"component:bio geo conservation",bio-geo-arch-con
+"component:biodiversity net gain",bng
+"component:description of the proposal",proposal-details
+"component:development description",proposal-details
+"component:eligibility",eligibility
+"component:eligibility current building",eligibility-current-building
+"component:ground for app",grounds-for-application
+"component:grounds for app ldc",grounds-ldc
+"component:immunity from listing",immunity-from-listing
+"component:location of advertisement(s)",advert-location
+"component:materials",materials
+"component:neighbour and community consultation",community-consultation
+"component:non-res floorspace",non-res-floorspace
+"component:ownership certificates",ownership-certs
+"component:ownership certs + agr",ownership-certs
+"component:pre-application advice",pre-app-advice
+"component:site address details",site-details
+"component:site visit",site-visit
@@ -0,0 +1,25 @@
+import csv
+
+
+def read_csv(filename, encoding="utf-8", as_dict=False, include_row_num=False):
+    """
+    Load every row of a CSV file into a list.
+
+    Args:
+        filename: Path of the CSV file to read
+        encoding: Text encoding used to open the file
+        as_dict: If True, parse with csv.DictReader (rows are dicts keyed by
+            the header row); otherwise parse with csv.reader (rows are lists
+            and the header row is returned as the first row)
+        include_row_num: If True, attach a 1-based row number to each row:
+            under the "_row_num" key for dict rows, or inserted at index 0
+            for list rows
+
+    Returns:
+        List of rows in file order
+    """
+    rows = []
+    with open(filename, newline="", encoding=encoding) as handle:
+        parser = csv.DictReader(handle) if as_dict else csv.reader(handle)
+        # Numbering counts the rows the parser yields, starting at 1
+        for number, record in enumerate(parser, start=1):
+            if include_row_num and as_dict:
+                record["_row_num"] = number
+            elif include_row_num:
+                # Put the row number in front of the row's own values
+                record.insert(0, number)
+            rows.append(record)
+
+    return rows
@@ -0,0 +1,185 @@
+import os
+from collections import Counter
+from datetime import datetime
+from typing import Any, Dict, List
+
+import requests
+from json_helpers import load_json, save_json
+
+# from dotenv import load_dotenv
+
+# load_dotenv()
+
+# Default JSON file used to cache fetched issues. The path is relative, so it
+# resolves against the current working directory of the running process.
+cached_issues_file = "cache/github_issues_cache.json"
+
+
+def get_open_issues(
+    repo_owner: str = "digital-land",
+    repo_name: str = "planning-application-data-specification",
+    github_token: str = None,
+) -> List[Dict[str, Any]]:
+    """
+    Fetch all open issues (excluding pull requests) from a GitHub repository.
+
+    Requests the repository's issues endpoint 100 items per page until an
+    empty page comes back. Errors are reported with print() and stop the
+    pagination early, so whatever was collected up to that point is returned.
+
+    Args:
+        repo_owner: GitHub repository owner
+        repo_name: GitHub repository name
+        github_token: GitHub token for authentication (optional). When not
+            given, the GITHUB_TOKEN environment variable is used; if that is
+            unset or empty too, requests are sent unauthenticated.
+
+    Returns:
+        List of issue dictionaries
+    """
+    # Fall back to the environment so the advice printed on rate limiting
+    # ("Add a GITHUB_TOKEN environment variable") actually takes effect.
+    if github_token is None:
+        github_token = os.getenv("GITHUB_TOKEN")
+
+    # HEADERS (use token for higher rate limit)
+    headers = {
+        "Accept": "application/vnd.github+json",
+        "X-GitHub-Api-Version": "2022-11-28",
+    }
+    if github_token:
+        headers["Authorization"] = f"Bearer {github_token}"
+
+    # PAGINATION VARIABLES
+    issues_url = f"https://api.github.com/repos/{repo_owner}/{repo_name}/issues"
+    params = {"state": "open", "per_page": 100, "page": 1}
+
+    all_issues = []
+
+    # PAGINATE THROUGH RESULTS
+    while True:
+        try:
+            # Without a timeout a stalled connection would block forever;
+            # a timeout error is reported by the generic handler below.
+            response = requests.get(
+                issues_url, headers=headers, params=params, timeout=30
+            )
+
+            # Handle rate limiting
+            if response.status_code == 403:
+                print(f"Error 403: {response.json().get('message', 'Forbidden')}")
+                if "rate limit" in response.text.lower():
+                    print("You've hit the rate limit. Please:")
+                    print("1. Wait a bit and try again")
+                    print(
+                        "2. Add a GITHUB_TOKEN environment variable for higher limits"
+                    )
+                break
+
+            response.raise_for_status()
+            issues = response.json()
+
+            # An empty page means every issue has been read
+            if not issues:
+                break
+
+            for issue in issues:
+                # Skip pull requests (they are also issues)
+                if "pull_request" not in issue:
+                    all_issues.append(issue)
+
+            params["page"] += 1
+
+        except requests.exceptions.HTTPError as e:
+            print(f"HTTP Error: {e}")
+            print(f"Response: {response.text}")
+            break
+        except Exception as e:
+            print(f"Unexpected error: {e}")
+            break
+
+    return all_issues
+
+
+def save_issues_to_file(
+    issues: List[Dict[str, Any]], filename: str = cached_issues_file
+):
+    """
+    Write issues to the cache file together with fetch metadata.
+
+    Args:
+        issues: List of issue dictionaries to store
+        filename: Destination passed to save_json (defaults to the cache file)
+    """
+    # Take the time once so both stored timestamps describe the same instant
+    fetched_at = datetime.now()
+    data = {
+        "fetch_timestamp": fetched_at.isoformat(),
+        "fetch_timestamp_human": fetched_at.strftime("%Y-%m-%d %H:%M:%S"),
+        "issue_count": len(issues),
+        "issues": issues,
+    }
+    save_json(data, filename)
+
+
+def load_issues_from_file(filename: str = cached_issues_file) -> Dict[str, Any]:
+    """
+    Read the cached issue data back from disk.
+
+    Args:
+        filename: File handed to load_json (defaults to the cache file)
+
+    Returns:
+        Whatever load_json returned when it is truthy; otherwise None, after
+        printing a notice
+    """
+    cached = load_json(filename)
+    if cached:
+        return cached
+
+    print("No data found.")
+    return None
+
+
+def get_issues_with_cache(
+    cache_hours: int = 1, force_refresh: bool = False
+) -> tuple[List[Dict[str, Any]], str]:
+    """
+    Return open issues, served from the on-disk cache while it is fresh.
+
+    Issues are fetched again (and the cache rewritten) when force_refresh is
+    set, when there is no cached data, or when the cached data is at least
+    cache_hours old.
+
+    Args:
+        cache_hours: Age in hours from which the cache counts as stale
+        force_refresh: If True, fetch again regardless of the cache's age
+
+    Returns:
+        Tuple of (issues_list, last_fetch_time)
+    """
+    cache = load_issues_from_file()
+    refresh = force_refresh
+    fetched_at = None
+
+    if not cache:
+        print("No cached data found, fetching new issues...")
+        refresh = True
+    else:
+        fetched_at = cache.get("fetch_timestamp_human", "Unknown")
+        stamp = datetime.fromisoformat(cache["fetch_timestamp"])
+        hours_old = (datetime.now() - stamp).total_seconds() / 3600
+        if hours_old >= cache_hours:
+            print(f"Cache is too old ({hours_old:.2f} hours), refreshing...")
+            refresh = True
+
+    # Fresh enough: answer straight from the cache
+    if not refresh:
+        return cache.get("issues", []), fetched_at
+
+    print("Fetching new issues from GitHub...")
+    fresh = get_open_issues()
+    save_issues_to_file(fresh)
+    return fresh, datetime.now().strftime("%Y-%m-%d %H:%M:%S")
+
+
+def count_labels_from_issues(issues: List[Dict[str, Any]]) -> Counter:
+    """
+    Tally how many of the given issues carry each label.
+
+    Args:
+        issues: List of issue dictionaries; each must have a "labels" list
+            whose entries have a "name" key
+
+    Returns:
+        Counter mapping label name to the number of occurrences
+    """
+    return Counter(
+        label["name"] for issue in issues for label in issue["labels"]
+    )
+
+
+# USAGE EXAMPLE
+if __name__ == "__main__":
+    # Load the open issues, going through the on-disk cache
+    issues, last_fetch_time = get_issues_with_cache()
+
+    # Tally how many open issues carry each label
+    label_counter = count_labels_from_issues(issues)
+
+    # Summary: total, then one line per label, most frequent first
+    print(f"Found {len(issues)} open issues")
+    print("\nOpen issues by label:")
+    for name, total in label_counter.most_common():
+        print(f"{name}: {total}")
+
+    # The issue dictionaries can be used directly,
+    # e.g. to list the titles of the first five
+    print("\nIssue titles:")
+    for entry in issues[:5]:
+        print(f"- {entry['title']}")
+
+    # Dump the complete issue list
+    print(issues)