Hi,

I wrote a quick and dirty Python 3 script to track upstream package version 
including last GIT commit and commit date, so you can compare Hedora's version 
with upstream. This is slightly better than Anitya as it supports commit.

It takes as input a file containing one Fedora package per line and as output 
a "TODO Golang update.csv".

I have not put this on Github yet but if you're interested in improving it, I 
can do that. I'm not a programming specialist so I'm sure there is tons of 
errors and dirty hack in there.

I'm joining the script and an example output from almost all packages we have.

Best regards,

Robert-André
#!/usr/bin/python3
import asyncio
import aiohttp
import asyncio_throttle
import backoff
from bs4 import BeautifulSoup
import time
import re
import sys


def all_go_packages(filename):
    with open(filename) as f:
        pkgs = [line.rstrip() for line in f if line != ""]
    return pkgs


def write_to_file(data):
    f = open("TODO Golang update.csv", "a")
    f.write(data)
    f.close()


def erase():
    f = open("TODO Golang update.csv", "w")
    f.write("")
    f.close()


def extract_commit_info(fedrel):
    reldata = re.search("(\d{8})git([a-f0-9]+)", fedrel, flags=re.MULTILINE)
    if reldata:
        return reldata.group(1), reldata.group(2)
    else:
        return "", ""


def convert_date(datein):
    try:
        dateout = time.strftime("%Y%m%d", time.strptime(datein, "%b %d, %Y"))
    except:
        return datein
    return dateout


def convert_version(version_string):
    version_data = re.search(
        "v([\d+][\.\d]+)(\-\d{14}\-)*([a-f0-9]*)",
        version_string,
        flags=re.MULTILINE,
    )
    if version_data:
        version = version_data.group(1)
    else:
        return "0", ""
    if "0.0.0" in version:
        version = 0
    if version_data.group(3):
        commit = version_data.group(3)
    else:
        commit = ""
    return str(version), commit


@backoff.on_exception(
    backoff.expo, (aiohttp.ClientError, asyncio.TimeoutError), max_time=30
)
async def get_fedora_version(pkg):
    if pkg:
      url = f"https://apps.fedoraproject.org/mdapi/koji/srcpkg/{pkg}";
      timeout = aiohttp.ClientTimeout(total=60)
      async with aiohttp.ClientSession(timeout=timeout) as session:
          try:
              async with session.get(url) as resp:
                  if resp.status == 404:
                      return "unknown", "unknown"
                  resp.raise_for_status()
                  data = await resp.json()
                  ver = data["version"]
                  rel = data["release"]
                  return str(ver), str(rel)
          except asyncio.TimeoutError:
              print(f"Timeout get_fedora_version {pkg}")
          except:
              raise


@backoff.on_exception(
    backoff.expo, (aiohttp.ClientError, asyncio.TimeoutError), max_time=30
)
async def get_fedora_goipath(pkg):
    if pkg:
      url = f"https://src.fedoraproject.org/rpms/{pkg}/raw/master/f/{pkg}.spec";
      timeout = aiohttp.ClientTimeout(total=60)
      async with aiohttp.ClientSession(timeout=timeout) as session:
          try:
              async with session.get(url) as resp:
                  if resp.status == 404:
                      return "unknown"
                  resp.raise_for_status()
                  spec = await resp.text()
                  ipath = re.search("(goipath)\s+(.*)$", spec, flags=re.MULTILINE)
                  if ipath:
                      return ipath.group(2)
                  else:
                      return "unknown"
          except asyncio.TimeoutError:
              print(f"Timeout get_fedora_goipath {pkg}")
          except:
              raise


@backoff.on_exception(
    backoff.expo, (aiohttp.ClientError, asyncio.TimeoutError), max_time=30
)
async def get_upstream_version(goipath):
    url = f"https://pkg.go.dev/mod/{goipath}?tab=versions";
    timeout = aiohttp.ClientTimeout(total=60)
    async with aiohttp.ClientSession(timeout=timeout) as session:
        try:
            async with session.get(url) as resp:
                if resp.status == 404 or resp.status == 400:
                    return 0, "unknown", "unknown"
                resp.raise_for_status()
                page = await resp.text()
                soup = BeautifulSoup(page, "html.parser")
                li_elmt = soup.findAll("li", {"class": "Versions-item"})[0]
                version, commit = convert_version(li_elmt.a.string)
                commitdate = convert_date(li_elmt.span.string[3:])
                return version, commit, commitdate
        except asyncio.TimeoutError:
            print(f"Timeout get_upstream_version {pkg}")
            return get_upstream_version(goipath)
        except:
            raise


async def check_version(pkg):
    fedora_version, fedora_release = await get_fedora_version(pkg)
    goipath = await get_fedora_goipath(pkg)
    fedora_date, fedora_commit = extract_commit_info(fedora_release)
    if goipath and not "unknown" in goipath:
        upstream_version, upstream_commit, upstream_date = await get_upstream_version(
            goipath
        )
    else:
        write_to_file(
            f"{pkg} Fedora,{fedora_version},{fedora_date},{fedora_commit}\nunknown Upstream,unknown,unknown,unknown\n\n"
        )
        return
    if fedora_version == "0" and upstream_version == "0":
        if not fedora_commit in upstream_commit:
            write_to_file(
                f"{pkg} Fedora,{fedora_version},{fedora_date},{fedora_commit}\n{goipath} Upstream,{upstream_version},{upstream_date},{upstream_commit}\n\n"
            )
            return
    elif fedora_version != upstream_version:
        if not fedora_commit in upstream_commit:
            write_to_file(
                f"{pkg} Fedora,{fedora_version},{fedora_date},{fedora_commit}\n{goipath} Upstream,{upstream_version},{upstream_date},{upstream_commit}\n\n"
            )
            return
    return


async def main(loop):
    erase()
    no_concurrent = 5
    tasks = set()
    pkgs = all_go_packages(sys.argv[1])
    i = 0
    while i < len(pkgs):
        if len(tasks) >= no_concurrent:
            # Wait for some download to finish before adding a new one
            _done, tasks = await asyncio.wait(
                tasks, return_when=asyncio.FIRST_COMPLETED
            )
        tasks.add(loop.create_task(check_version(pkgs[i])))
        i += 1
    # Wait for the remaining downloads to finish
    await asyncio.wait(tasks)


if __name__ == "__main__":
    loop = asyncio.get_event_loop()
    try:
        loop.run_until_complete(main(loop))
    finally:
        loop.close()

<<attachment: TODO_Golang_update.csv.zip>>

_______________________________________________
golang mailing list -- golang@lists.fedoraproject.org
To unsubscribe send an email to golang-le...@lists.fedoraproject.org
Fedora Code of Conduct: 
https://docs.fedoraproject.org/en-US/project/code-of-conduct/
List Guidelines: https://fedoraproject.org/wiki/Mailing_list_guidelines
List Archives: 
https://lists.fedoraproject.org/archives/list/golang@lists.fedoraproject.org

Reply via email to