VOICEVOX-Engine / voicevox_engine /tools /generate_licenses.py
Jirat Jaturanpinyo
Upload voicevox_engine
edc06cb verified
raw
history blame
13.9 kB
import json
import os
import subprocess
import urllib.request
from pathlib import Path
from typing import Literal
class LicenseError(Exception):
# License違反があった場合、このエラーを出します。
pass
class License:
def __init__(
self,
package_name: str,
package_version: str | None,
license_name: str | None,
license_text: str,
license_text_type: Literal["raw", "local_address", "remote_address"],
):
self.package_name = package_name
self.package_version = package_version
self.license_name = license_name
if license_text_type == "raw":
self.license_text = license_text
elif license_text_type == "local_address":
# ライセンステキストをローカルのライセンスファイルから抽出する
self.license_text = Path(license_text).read_text(encoding="utf8")
elif license_text_type == "remote_address":
self.license_text = get_license_text(license_text)
else:
raise Exception("型で保護され実行されないはずのパスが実行されました")
def get_license_text(text_url: str) -> str:
"""URL が指すテキストを取得する。"""
with urllib.request.urlopen(text_url) as res:
# NOTE: `urlopen` 返り値の型が貧弱なため型チェックを無視する
return res.read().decode() # type: ignore
def generate_licenses() -> list[License]:
licenses: list[License] = []
# pip
try:
pip_licenses_output = subprocess.run(
"pip-licenses "
"--from=mixed "
"--format=json "
"--with-urls "
"--with-license-file "
"--no-license-path ",
shell=True,
capture_output=True,
check=True,
env=os.environ,
).stdout.decode()
except subprocess.CalledProcessError as err:
raise Exception(
f"command output:\n{err.stderr and err.stderr.decode()}"
) from err
licenses_json = json.loads(pip_licenses_output)
for license_json in licenses_json:
# ライセンス文を pip 外で取得されたもので上書きする
package_name: str = license_json["Name"].lower()
if license_json["LicenseText"] == "UNKNOWN":
if package_name == "core" and license_json["Version"] == "0.0.0":
continue
elif package_name == "future":
text_url = "https://raw.githubusercontent.com/PythonCharmers/python-future/master/LICENSE.txt" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "pefile":
text_url = "https://raw.githubusercontent.com/erocarrera/pefile/master/LICENSE" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "pyopenjtalk":
text_url = "https://raw.githubusercontent.com/r9y9/pyopenjtalk/master/LICENSE.md" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "python-multipart":
text_url = "https://raw.githubusercontent.com/andrew-d/python-multipart/master/LICENSE.txt" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "romkan":
text_url = "https://raw.githubusercontent.com/soimort/python-romkan/master/LICENSE" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "distlib":
text_url = "https://bitbucket.org/pypa/distlib/raw/7d93712134b28401407da27382f2b6236c87623a/LICENSE.txt" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "jsonschema":
text_url = "https://raw.githubusercontent.com/python-jsonschema/jsonschema/dbc398245a583cb2366795dc529ae042d10c1577/COPYING" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "lockfile":
text_url = "https://opendev.org/openstack/pylockfile/raw/tag/0.12.2/LICENSE" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "platformdirs":
text_url = "https://raw.githubusercontent.com/platformdirs/platformdirs/aa671aaa97913c7b948567f4d9c77d4f98bfa134/LICENSE" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
elif package_name == "webencodings":
text_url = "https://raw.githubusercontent.com/gsnedders/python-webencodings/fa2cb5d75ab41e63ace691bc0825d3432ba7d694/LICENSE" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
else:
# ライセンスがpypiに無い
raise Exception(f"No License info provided for {package_name}")
# soxr
if package_name == "soxr":
text_url = "https://raw.githubusercontent.com/dofuuz/python-soxr/v0.3.6/LICENSE.txt" # noqa: B950
license_json["LicenseText"] = get_license_text(text_url)
license = License(
package_name=license_json["Name"],
package_version=license_json["Version"],
license_name=license_json["License"],
license_text=license_json["LicenseText"],
license_text_type="raw",
)
# ライセンスを確認する
license_names_str = license.license_name or ""
license_names = license_names_str.split("; ")
for license_name in license_names:
if license_name in [
"GNU General Public License v2 (GPLv2)",
"GNU General Public License (GPL)",
"GNU General Public License v3 (GPLv3)",
"GNU Affero General Public License v3 (AGPL-3)",
]:
raise LicenseError(
f"ライセンス違反: {license.package_name} is {license.license_name}"
)
licenses.append(license)
python_version = "3.11.3"
licenses += [
# https://sourceforge.net/projects/open-jtalk/files/Open%20JTalk/open_jtalk-1.11/
License(
package_name="Open JTalk",
package_version="1.11",
license_name="Modified BSD license",
license_text="tools/licenses/open_jtalk/COPYING",
license_text_type="local_address",
),
License(
package_name="MeCab",
package_version=None,
license_name="Modified BSD license",
license_text="tools/licenses/open_jtalk/mecab/COPYING",
license_text_type="local_address",
),
License(
package_name="NAIST Japanese Dictionary",
package_version=None,
license_name="Modified BSD license",
license_text="tools/licenses//open_jtalk/mecab-naist-jdic/COPYING",
license_text_type="local_address",
),
License(
package_name='HTS Voice "Mei"',
package_version=None,
license_name="Creative Commons Attribution 3.0 license",
license_text="https://raw.githubusercontent.com/r9y9/pyopenjtalk/master/pyopenjtalk/htsvoice/LICENSE_mei_normal.htsvoice", # noqa: B950
license_text_type="remote_address",
),
License(
package_name="VOICEVOX CORE",
package_version=None,
license_name="MIT license",
license_text="https://raw.githubusercontent.com/VOICEVOX/voicevox_core/main/LICENSE",
license_text_type="remote_address",
),
License(
package_name="VOICEVOX ENGINE",
package_version=None,
license_name="LGPL license",
license_text="https://raw.githubusercontent.com/VOICEVOX/voicevox_engine/master/LGPL_LICENSE",
license_text_type="remote_address",
),
License(
package_name="world",
package_version=None,
license_name="Modified BSD license",
license_text="https://raw.githubusercontent.com/mmorise/World/master/LICENSE.txt",
license_text_type="remote_address",
),
License(
package_name="PyTorch",
package_version="1.9.0",
license_name="BSD-style license",
license_text="https://raw.githubusercontent.com/pytorch/pytorch/master/LICENSE",
license_text_type="remote_address",
),
License(
package_name="ONNX Runtime",
package_version="1.13.1",
license_name="MIT license",
license_text="https://raw.githubusercontent.com/microsoft/onnxruntime/master/LICENSE",
license_text_type="remote_address",
),
License(
package_name="Python",
package_version=python_version,
license_name="Python Software Foundation License",
license_text=f"https://raw.githubusercontent.com/python/cpython/v{python_version}/LICENSE",
license_text_type="remote_address",
),
# OpenBLAS
License(
package_name="OpenBLAS",
package_version=None,
license_name="BSD 3-clause license",
license_text="https://raw.githubusercontent.com/xianyi/OpenBLAS/develop/LICENSE",
license_text_type="remote_address",
),
License(
package_name="libsndfile-binaries",
package_version="1.2.0",
license_name="LGPL-2.1 license",
license_text="https://raw.githubusercontent.com/bastibe/libsndfile-binaries/d9887ef926bb11cf1a2526be4ab6f9dc690234c0/COPYING", # noqa: B950
license_text_type="remote_address",
),
License(
package_name="libogg",
package_version="1.3.5",
license_name="BSD 3-clause license",
license_text="https://raw.githubusercontent.com/xiph/ogg/v1.3.5/COPYING",
license_text_type="remote_address",
),
License(
package_name="libvorbis",
package_version="1.3.7",
license_name="BSD 3-clause license",
license_text="https://raw.githubusercontent.com/xiph/vorbis/v1.3.7/COPYING",
license_text_type="remote_address",
),
# libflac
License(
package_name="FLAC",
package_version="1.4.2",
license_name="Xiph.org's BSD-like license",
license_text="https://raw.githubusercontent.com/xiph/flac/1.4.2/COPYING.Xiph",
license_text_type="remote_address",
),
# libopus
License(
package_name="Opus",
package_version="1.3.1",
license_name="BSD 3-clause license",
license_text="https://raw.githubusercontent.com/xiph/opus/v1.3.1/COPYING",
license_text_type="remote_address",
),
# https://sourceforge.net/projects/mpg123/files/mpg123/1.30.2/
License(
package_name="mpg123",
package_version="1.30.2",
license_name="LGPL-2.1 license",
license_text="tools/licenses/mpg123/COPYING",
license_text_type="local_address",
),
# liblame
# https://sourceforge.net/projects/lame/files/lame/3.100/
License(
package_name="lame",
package_version="3.100",
license_name="LGPL-2.0 license",
license_text="https://svn.code.sf.net/p/lame/svn/tags/RELEASE__3_100/lame/COPYING",
license_text_type="remote_address",
),
# license text from CUDA 11.8.0
# https://developer.nvidia.com/cuda-11-8-0-download-archive?target_os=Windows&target_arch=x86_64&target_version=10&target_type=exe_local # noqa: B950
# https://developer.download.nvidia.com/compute/cuda/11.8.0/local_installers/cuda_11.8.0_522.06_windows.exe # noqa: B950
# cuda_11.8.0_522.06_windows.exe (cuda_documentation/Doc/EULA.txt)
License(
package_name="CUDA Toolkit",
package_version="11.8.0",
license_name=None,
license_text="tools/licenses/cuda/EULA.txt",
license_text_type="local_address",
),
# license text from cuDNN v8.9.2 (June 1st, 2023), for CUDA 11.x, cuDNN Library for Windows # noqa: B950
# https://developer.nvidia.com/rdp/cudnn-archive # noqa: B950
# https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/windows-x86_64/cudnn-windows-x86_64-8.9.2.26_cuda11-archive.zip # noqa: B950
# cudnn-windows-x86_64-8.9.2.26_cuda11-archive.zip (cudnn-windows-x86_64-8.9.2.26_cuda11-archive/LICENSE) # noqa: B950
License(
package_name="cuDNN",
package_version="8.9.2",
license_name=None,
license_text="tools/licenses/cudnn/LICENSE",
license_text_type="local_address",
),
]
return licenses
if __name__ == "__main__":
import argparse
import sys
parser = argparse.ArgumentParser()
parser.add_argument("-o", "--output_path", type=str)
args = parser.parse_args()
output_path = args.output_path
licenses = generate_licenses()
# dump
out = Path(output_path).open("w") if output_path else sys.stdout
json.dump(
[
{
"name": license.package_name,
"version": license.package_version,
"license": license.license_name,
"text": license.license_text,
}
for license in licenses
],
out,
)