from bs4 import BeautifulSoup
import requests
import re
import datefinder  # library for extracting dates from free-form text
from project import Project
from shared import CSC_MIRROR


class ubuntu_ports_releases(Project):
    """Checks that the CSC mirror of the Ubuntu Ports release files is at
    least as up-to-date as the upstream site."""

    @staticmethod
    def checker(directory_URL, file_name):
        """Return the last-modified datetime listed next to file_name in the
        directory index at directory_URL, or False if the file is absent."""
        page = requests.get(directory_URL).text
        file_index = page.find(file_name)

        if file_index == -1:
            return False

        # Directory indexes print dates as either "02-Jan-2021 13:45" or
        # "2021-01-02 13:45"; take the first date that follows the file name.
        str_dates = re.findall(r'(\d{2}-\w{3}-\d{4} \d{2}:\d{2})|(\d{4}-\d{2}-\d{2} \d{2}:\d{2})', page[file_index:])

        return list(datefinder.find_dates("".join(str_dates[0])))[0]
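
    # Illustrative call (the URL is hypothetical, for illustration only):
    #   checker("http://cdimage.ubuntu.com/releases/", "SHA256SUMS")
    # would return the datetime shown beside SHA256SUMS in that listing.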

    @classmethod
    def scrape(cls, compare, folders, site1, site2, directory):
        """Recursively walk `directory` on site1 (upstream), comparing the
        timestamps of its checksum files against site2 (the mirror)."""
        # A directory containing MD5SUMS (or SHA256SUMS) is a release
        # directory: compare its timestamp on both sites and stop recursing.
        # The checker results are cached so each page is fetched only once.
        for file_name in ("MD5SUMS", "SHA256SUMS"):
            upstream_date = cls.checker(site1 + directory, file_name)
            if upstream_date is not False:
                mirror_date = cls.checker(site2 + directory, file_name)
                if mirror_date is not False:
                    # The mirror is up to date if its copy is at least as new
                    compare.append(upstream_date <= mirror_date)
                else:
                    # The mirror is missing the checksum file entirely
                    compare.append(False)
                return

        # getting the request from url
        r = requests.get(site1 + directory)

        # converting the text
        s = BeautifulSoup(r.text, "html.parser")

        for i in s.find_all("a"):  # for <a href> directories
            href = i.attrs['href']

            if href.endswith("/") and href != "../" and href != "/" and not href.startswith("/") and not href.startswith("http://"):
                dir_next = directory + href

                # recurse into subdirectories we have not visited yet
                if dir_next not in folders:
                    folders.append(dir_next)
                    cls.scrape(compare, folders, site1, site2, dir_next)

    @classmethod
    def check(cls, data, project, current_time):
        """Check if project packages are up-to-date"""
        compare = []  # per-directory comparison results
        folders = []  # directories already visited

        csc_url = CSC_MIRROR + data[project]["csc"] + data[project]["file"]
        upstream_url = data[project]["upstream"] + data[project]["file"]

        # walk the upstream tree, comparing each release directory
        cls.scrape(compare, folders, upstream_url, csc_url, "")

        return all(compare)
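

# A minimal usage sketch (assumptions: the key names below mirror those read
# in check() above; the project name, URLs, and paths are illustrative and
# not taken from this repo's actual data file).
if __name__ == "__main__":
    import time

    example_data = {
        "ubuntu-ports-releases": {
            "csc": "ubuntu-ports-releases/",           # path under CSC_MIRROR (assumed)
            "upstream": "http://cdimage.ubuntu.com/",  # upstream base URL (assumed)
            "file": "releases/",                       # subtree to walk (assumed)
        }
    }
    print(ubuntu_ports_releases.check(example_data, "ubuntu-ports-releases", time.time()))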