Add script for license scanner (#2267)

* Add script for license scanner

This script will scan the source tree for license files and generate a file with the contents of all the licenses.

Signed-off-by: brianherrera <briher@amazon.com>
main
Brian Herrera 4 years ago committed by GitHub
parent d640e7ea30
commit 173126f5a5
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@ -0,0 +1,129 @@
#
# Copyright (c) Contributors to the Open 3D Engine Project. For complete copyright and license terms please see the LICENSE at the root of this distribution.
#
# SPDX-License-Identifier: Apache-2.0 OR MIT
#
#
import argparse
import fnmatch
import json
import os
import pathlib
import re
import sys
class LicenseScanner:
"""Class to contain license scanner.
Scans source tree for license files using provided filename patterns and generates a file
with the contents of all the licenses.
:param config_file: Config file with license patterns and scanner settings
"""
DEFAULT_CONFIG_FILE = 'scanner_config.json'
def __init__(self, config_file=None):
self.config_file = config_file
self.config_data = self._load_config()
self.license_regex = self._load_license_regex()
def _load_config(self):
"""Load config from the provided file. Sets default file if one is not provided."""
if self.config_file is None:
script_directory = os.path.dirname(os.path.abspath(__file__)) # Default file expected in same dir as script
self.config_file = os.path.join(script_directory, self.DEFAULT_CONFIG_FILE)
try:
with open(self.config_file) as f:
return json.load(f)
except FileNotFoundError:
print('Config file cannot be found')
raise
def _load_license_regex(self):
"""Returns regex object with case-insensitive matching from the list of filename patterns."""
regex_patterns = []
for pattern in self.config_data['license_patterns']:
regex_patterns.append(fnmatch.translate(pattern))
return re.compile('|'.join(regex_patterns), re.IGNORECASE)
def scan(self, path=os.curdir):
"""Scan directory tree for filenames matching license_regex.
:param path: Path of the directory to run scanner
:return: Package paths and their corresponding license file contents
:rtype: dict
"""
licenses = 0
license_files = {}
for dirpath, dirnames, filenames in os.walk(path):
for file in filenames:
if self.license_regex.match(file):
license_file_content = self._get_license_file_contents(os.path.join(dirpath, file))
rel_dirpath = os.path.relpath(dirpath, path) # Limit path inside scanned directory
license_files[rel_dirpath] = license_file_content
licenses += 1
print(f'License file: {os.path.join(dirpath, file)}')
# Remove directories that should not be scanned
for dir in self.config_data['excluded_directories']:
if dir in dirnames:
dirnames.remove(dir)
print(f'{licenses} license files found.')
return license_files
def _get_license_file_contents(self, filepath):
try:
with open(filepath, encoding='utf8') as f:
return f.read()
except UnicodeDecodeError:
print(f'Unable to read license file: {filepath}')
pass
def create_license_file(self, licenses, filepath='NOTICES.txt'):
"""Creates file with all the provided license file contents.
:param licenses: Dict with package paths and their corresponding license file contents
:param filepath: Path to write the file
"""
package_separator = '------------------------------------'
with open(filepath, 'w', encoding='utf8') as f:
for directory, license in licenses.items():
license_output = '\n\n'.join([
f'{package_separator}',
f'Package path: {directory}',
'License:',
f'{license}\n'
])
f.write(license_output)
return None
def parse_args():
parser = argparse.ArgumentParser(
description='Script to run LicenseScanner and generate license file')
parser.add_argument('--config-file', '-c', type=pathlib.Path, help='Config file for LicenseScanner')
parser.add_argument('--license-file-path', '-l', type=pathlib.Path, help='Create license file in the provided path')
parser.add_argument('--scan-path', '-s', default=os.curdir, type=pathlib.Path, help='Path to scan')
return parser.parse_args()
def main():
try:
args = parse_args()
ls = LicenseScanner(args.config_file)
licenses = ls.scan(args.scan_path)
if args.license_file_path:
ls.create_license_file(licenses, args.license_file_path)
except FileNotFoundError as e:
print(f'Type: {type(e).__name__}, Error: {e}')
return 1
if __name__ == '__main__':
sys.exit(main())

@ -0,0 +1,12 @@
{
"excluded_directories": [
".git",
".venv",
"build",
"license_scanner"
],
"license_patterns": [
"LICENSE*",
"COPYING*"
]
}
Loading…
Cancel
Save