electron/script/check-relative-doc-links.py

#!/usr/bin/env python

from __future__ import print_function
import os
import sys
import re


# Repository root: the parent of the directory that contains this script.
# __file__ is made absolute *before* taking the directory names; when the
# script is started with a bare relative name (for example from inside its
# own directory on interpreters that keep __file__ relative), dirname()
# would otherwise collapse to '' and the root would resolve to the current
# directory instead of its parent.
SOURCE_ROOT = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
# Directory whose markdown files are scanned for broken relative links.
DOCS_DIR = os.path.join(SOURCE_ROOT, 'docs')


def main():
  """Scan every markdown file under DOCS_DIR and report broken links.

  Changes the working directory to SOURCE_ROOT, walks DOCS_DIR collecting
  all '*.md' files, runs getBrokenLinks() on each of them and prints a
  summary.

  Returns:
    The total number of broken relative links found, or 0 if the directory
    walk was interrupted from the keyboard.
  """
  os.chdir(SOURCE_ROOT)

  markdownFiles = []
  subdirCount = 0
  try:
    for root, dirs, files in os.walk(DOCS_DIR):
      subdirCount += len(dirs)
      markdownFiles.extend(
        os.path.join(root, name) for name in files if name.endswith('.md')
      )
  except KeyboardInterrupt:
    print('Keyboard interruption. Please try again.')
    return 0

  # Each call also prints the broken links of the file it inspected.
  brokenTotal = sum(getBrokenLinks(path) for path in markdownFiles)

  summary = ('Parsed through ' + str(len(markdownFiles)) +
             ' files within docs directory and its ' +
             str(subdirCount) + ' subdirectories.')
  print(summary)
  print('Found ' + str(brokenTotal) + ' broken relative links.')
  return brokenTotal


def _readLines(path):
  """Return the lines of the text file at `path`.

  The file is always closed, including when opening or reading fails. A
  KeyboardInterrupt is reported and then re-raised so that callers never
  continue with missing data.
  """
  try:
    with open(path, 'r') as handle:
      return handle.readlines()
  except KeyboardInterrupt:
    print('Keyboard interruption while parsing. Please try again.')
    raise


def getBrokenLinks(filepath):
  """Find, print and count the broken relative links of one markdown file.

  Both inline links (`[text](target)`) and reference definitions
  (`[label]: target`) are collected; targets starting with 'http' are
  skipped. Each remaining target is resolved against the directory of
  `filepath`:
    * 'file'          - the file must exist
    * '#anchor'       - a matching heading must exist in this file
    * 'file#anchor'   - the file must exist and contain a matching heading

  Args:
    filepath: path of the markdown file to inspect.

  Returns:
    The number of broken links found in the file. The links themselves are
    reported through print_errors().
  """
  currentDir = os.path.dirname(filepath)
  brokenLinks = []

  lines = _readLines(filepath)

  linkRegexLink = re.compile(r'\[(.*?)\]\((?P<link>(.*?))\)')
  referenceLinkRegex = re.compile(
      r'^\s{0,3}\[.*?\]:\s*(?P<link>[^<\s]+|<[^<>\r\n]+>)'
  )
  links = []
  for line in lines:
    # finditer() rather than search(): a single line can carry several
    # inline links and every one of them has to be checked.
    for matchLink in linkRegexLink.finditer(line):
      relativeLink = matchLink.group('link')
      if not relativeLink.startswith('http'):
        links.append(relativeLink)
    # The reference pattern is anchored at the line start, so there is at
    # most one definition per line.
    matchReferenceLinks = referenceLinkRegex.search(line)
    if matchReferenceLinks:
      referenceLink = matchReferenceLinks.group('link').strip('<>')
      if not referenceLink.startswith('http'):
        links.append(referenceLink)

  for link in links:
    sections = link.split('#')
    if len(sections) < 2:
      # Plain file link without an anchor.
      if not os.path.isfile(os.path.join(currentDir, link)):
        brokenLinks.append(link)
    elif link.startswith('#'):
      # Anchor into the file currently being inspected.
      if not checkSections(sections, lines):
        brokenLinks.append(link)
    else:
      # Anchor into another file: the file has to exist and has to contain
      # the referenced heading.
      tempFile = os.path.join(currentDir, sections[0])
      if not os.path.isfile(tempFile):
        brokenLinks.append(link)
      elif not checkSections(sections, _readLines(tempFile)):
        brokenLinks.append(link)

  print_errors(filepath, brokenLinks)
  return len(brokenLinks)


def checkSections(sections, lines):
  """Tell whether `lines` contain a heading matching a link anchor.

  Args:
    sections: the link split on '#'; sections[1] is the anchor to look for.
    lines: the lines of the markdown file the anchor points into.

  Returns:
    True if the slug of some heading, lower-cased, equals the anchor;
    False otherwise.
  """
  invalidCharsRegex = r'[^A-Za-z0-9_ \-]'
  sectionHeader = sections[1]
  regexSectionTitle = re.compile(r'# (?P<header>.*)')
  # Splits a heading into backtick-quoted spans (group 1) and the text
  # between them (group 2).
  regexHeaderParts = re.compile(r'(`[^`]+`)|([^`]+)')
  for line in lines:
    matchHeader = regexSectionTitle.search(line)
    if not matchHeader:
      continue
    # This does the following to slugify a header name:
    #  * Drop leading/trailing whitespace, which is not part of the heading
    #    text and would otherwise turn into stray dashes
    #  * Replace whitespace with dashes
    #  * Strip anything that's not alphanumeric or a dash
    #  * Anything quoted with backticks (`) is an exception and will
    #    not have underscores stripped
    header = matchHeader.group('header').strip().replace(' ', '-')
    slug = ''.join(
      re.sub(invalidCharsRegex, '', quoted)
      + re.sub(invalidCharsRegex + '|_', '', plain)
      for quoted, plain in regexHeaderParts.findall(header)
    )
    if slug.lower() == sectionHeader:
      return True
  return False


def print_errors(filepath, brokenLink):
  """Print the file location followed by one line per broken link.

  Nothing is printed when `brokenLink` is empty.
  """
  if not brokenLink:
    return
  print("File Location: " + filepath)
  for entry in brokenLink:
    print("\tBroken links: " + entry)

if __name__ == '__main__':
  # The exit status is the number of broken links. Many systems keep only
  # the low 8 bits of an exit status, so an unclamped count that is a
  # multiple of 256 would be reported as success; cap it at 255.
  sys.exit(min(main(), 255))
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`#!/usr/bin/env python`

fix: use print() function in both Python 2 and Python 3 (#18395) Legacy print statements are syntax errors in Python 3 but print() function works as expected in both Python 2 and Python 3. Old style exceptions are syntax errors in Python 3 but new style exceptions work as expected in both Python 2 and Python 3. 2019-06-15 17:26:09 +00:00			`from __future__ import print_function`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`import os`
			`import sys`
			`import re`


			`SOURCE_ROOT = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))`
			`DOCS_DIR = os.path.join(SOURCE_ROOT, 'docs')`


			`def main():`
			`os.chdir(SOURCE_ROOT)`

			`filepaths = []`
test for relative links adheres to npm run lint 2017-12-14 03:06:16 +00:00			`totalDirs = 0`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`try:`
			`for root, dirs, files in os.walk(DOCS_DIR):`
test for relative links adheres to npm run lint 2017-12-14 03:06:16 +00:00			`totalDirs += len(dirs)`
			`for f in files:`
			`if f.endswith('.md'):`
			`filepaths.append(os.path.join(root, f))`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`except KeyboardInterrupt:`
			`print('Keyboard interruption. Please try again.')`
chore: fix pylint-2.7 errors (#33233) 2022-03-21 02:11:21 +00:00			`return 0`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00
			`totalBrokenLinks = 0`
			`for path in filepaths:`
			`totalBrokenLinks += getBrokenLinks(path)`

test for relative links adheres to npm run lint 2017-12-14 03:06:16 +00:00			`print('Parsed through ' + str(len(filepaths)) +`
			`' files within docs directory and its ' +`
			`str(totalDirs) + ' subdirectories.')`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`print('Found ' + str(totalBrokenLinks) + ' broken relative links.')`
chore: fix relative links in docs and enforce we dont break them again (#14832) 2018-09-28 03:16:38 +00:00			`return totalBrokenLinks`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00

			`def getBrokenLinks(filepath):`
			`currentDir = os.path.dirname(filepath)`
			`brokenLinks = []`

			`try:`
test for relative links adheres to npm run lint 2017-12-14 03:06:16 +00:00			`f = open(filepath, 'r')`
			`lines = f.readlines()`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`except KeyboardInterrupt:`
build: fix typos in script messages (#25766) 2020-10-05 14:38:50 +00:00			`print('Keyboard interruption while parsing. Please try again.')`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`finally:`
test for relative links adheres to npm run lint 2017-12-14 03:06:16 +00:00			`f.close()`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00
docs: improve relative link linting and fix broken (#26020) 2020-10-20 01:46:27 +00:00			`linkRegexLink = re.compile('\[(.*?)\]\((?P<link>(.*?))\)')`
chore: cleanup pylint violations (#26252) * chore: cleanup pylint violations * chore: cleanup pylint violatins 2020-11-02 06:43:21 +00:00			`referenceLinkRegex = re.compile(`
			`'^\s{0,3}\[.*?\]:\s*(?P<link>[^<\s]+|<[^<>\r\n]+>)'`
			`)`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`links = []`
			`for line in lines:`
docs: improve relative link linting and fix broken (#26020) 2020-10-20 01:46:27 +00:00			`matchLinks = linkRegexLink.search(line)`
			`matchReferenceLinks = referenceLinkRegex.search(line)`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`if matchLinks:`
docs: improve relative link linting and fix broken (#26020) 2020-10-20 01:46:27 +00:00			`relativeLink = matchLinks.group('link')`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`if not str(relativeLink).startswith('http'):`
			`links.append(relativeLink)`
docs: improve relative link linting and fix broken (#26020) 2020-10-20 01:46:27 +00:00			`if matchReferenceLinks:`
			`referenceLink = matchReferenceLinks.group('link').strip('<>')`
			`if not str(referenceLink).startswith('http'):`
			`links.append(referenceLink)`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00
			`for link in links:`
			`sections = link.split('#')`
chore: fix python lint warnings (#14638) * chore: fix lint warnings * chore: another try at python import errors Looks like the problem is that dbus_mock.py is running as a script but living in the `lib/` directory where it's part of a module. Moving it up into the `script/` directory seems to solve the issue. 2018-09-16 17:24:07 +00:00			`if len(sections) < 2:`
			`if not os.path.isfile(os.path.join(currentDir, link)):`
			`brokenLinks.append(link)`
			`elif str(link).startswith('#'):`
			`if not checkSections(sections, lines):`
			`brokenLinks.append(link)`
			`else:`
			`tempFile = os.path.join(currentDir, sections[0])`
			`if os.path.isfile(tempFile):`
			`try:`
			`newFile = open(tempFile, 'r')`
			`newLines = newFile.readlines()`
			`except KeyboardInterrupt:`
build: fix typos in script messages (#25766) 2020-10-05 14:38:50 +00:00			`print('Keyboard interruption while parsing. Please try again.')`
chore: fix python lint warnings (#14638) * chore: fix lint warnings * chore: another try at python import errors Looks like the problem is that dbus_mock.py is running as a script but living in the `lib/` directory where it's part of a module. Moving it up into the `script/` directory seems to solve the issue. 2018-09-16 17:24:07 +00:00			`finally:`
			`newFile.close()`

			`if not checkSections(sections, newLines):`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`brokenLinks.append(link)`
			`else:`
			`brokenLinks.append(link)`

chore: fix python lint warnings (#14638) * chore: fix lint warnings * chore: another try at python import errors Looks like the problem is that dbus_mock.py is running as a script but living in the `lib/` directory where it's part of a module. Moving it up into the `script/` directory seems to solve the issue. 2018-09-16 17:24:07 +00:00
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`print_errors(filepath, brokenLinks)`
			`return len(brokenLinks)`


test for relative links adheres to npm run lint 2017-12-14 03:06:16 +00:00			`def checkSections(sections, lines):`
chore: improve docs relative link linting (#26359) 2020-11-18 19:55:11 +00:00			`invalidCharsRegex = '[^A-Za-z0-9_ \-]'`
			`sectionHeader = sections[1]`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`regexSectionTitle = re.compile('# (?P<header>.*)')`
			`for line in lines:`
			`matchHeader = regexSectionTitle.search(line)`
			`if matchHeader:`
chore: improve docs relative link linting (#26359) 2020-11-18 19:55:11 +00:00			`# This does the following to slugify a header name:`
			`# * Replace whitespace with dashes`
			`# * Strip anything that's not alphanumeric or a dash`
			# * Anything quoted with backticks (`) is an exception and will
			`# not have underscores stripped`
			`matchHeader = str(matchHeader.group('header')).replace(' ', '-')`
			`matchHeader = ''.join(`
			`map(`
			`lambda match: re.sub(invalidCharsRegex, '', match[0])`
			`+ re.sub(invalidCharsRegex + '|_', '', match[1]),`
			re.findall('(`[^`]+`)|([^`]+)', matchHeader),
			`)`
			`)`
			`if matchHeader.lower() == sectionHeader:`
			`return True`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`return False`


			`def print_errors(filepath, brokenLink):`
			`if brokenLink:`
fix: use print() function in both Python 2 and Python 3 (#18395) Legacy print statements are syntax errors in Python 3 but print() function works as expected in both Python 2 and Python 3. Old style exceptions are syntax errors in Python 3 but new style exceptions work as expected in both Python 2 and Python 3. 2019-06-15 17:26:09 +00:00			`print("File Location: " + filepath)`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00			`for link in brokenLink:`
fix: use print() function in both Python 2 and Python 3 (#18395) Legacy print statements are syntax errors in Python 3 but print() function works as expected in both Python 2 and Python 3. Old style exceptions are syntax errors in Python 3 but new style exceptions work as expected in both Python 2 and Python 3. 2019-06-15 17:26:09 +00:00			`print("\tBroken links: " + link)`
:white_check_mark: Add test to check for relative links in docs directory 2017-12-13 02:32:47 +00:00

			`if __name__ == '__main__':`
			`sys.exit(main())`