#!/usr/bin/env python3

# Copyright (C) 2020  Matthew "strager" Glazar
# See end of file for extended copyright information.

import argparse
import collections
import json
import pathlib
import re
import subprocess
import sys
import typing
import unittest


def main() -> None:
    parser = argparse.ArgumentParser(__doc__)
    parser.add_argument("build_sizes_directory")
    args = parser.parse_args()

    build_sizes_directory = pathlib.Path(args.build_sizes_directory)
    git_commits = get_git_commits()
    all_builds = []
    for build_sizes_file in build_sizes_directory.iterdir():
        if build_sizes_file.suffix != ".json":
            continue
        content = build_sizes_file.read_text()
        if not content:
            sys.stderr.write(f"warning: file is empty: {build_sizes_file}\n")
            continue
        all_builds.append(json.loads(content))
    series = group_build_sizes(builds=all_builds, git_rev_list=git_commits)
    json.dump(series, sys.stdout, indent=2)


def get_git_commits() -> typing.List[str]:
    return subprocess.check_output(
        ["git", "rev-list", "--reverse", "--topo-order", "HEAD"],
        cwd=pathlib.Path(__file__).parent,
        encoding="utf-8",
    ).splitlines()


class TestGroupBuildSizes(unittest.TestCase):
    def test_group_basic_builds(self) -> None:
        builds = [
            {
                "readme": {"Git-Commit": "1"},
                "sizes": [
                    {"name": ["program.exe"], "type": "exe", "size": 42},
                    {"name": ["lib.js"], "type": "file", "size": 100},
                ],
            },
            {
                "readme": {"Git-Commit": "2"},
                "sizes": [
                    {"name": ["program.exe"], "type": "exe", "size": 44},
                    {"name": ["lib.js"], "type": "file", "size": 100},
                ],
            },
        ]
        git_rev_list = ["1", "2"]

        grouped_builds = group_build_sizes(builds, git_rev_list=git_rev_list)
        self.assertEqual(
            grouped_builds,
            [
                {
                    "name": ["lib.js"],
                    "type": "file",
                    "sizes": [
                        {"commit": "1", "size": 100},
                        {"commit": "2", "size": 100},
                    ],
                },
                {
                    "name": ["program.exe"],
                    "type": "exe",
                    "sizes": [
                        {"commit": "1", "size": 42},
                        {"commit": "2", "size": 44},
                    ],
                },
            ],
        )

    def test_commit_with_missing_build_has_null_size(self) -> None:
        builds = [
            {
                "readme": {"Git-Commit": "1"},
                "sizes": [
                    {"name": ["lib.js"], "type": "file", "size": 100},
                ],
            },
            {
                "readme": {"Git-Commit": "2"},
                "sizes": [
                    {"name": ["program.exe"], "type": "exe", "size": 42},
                    {"name": ["lib.js"], "type": "file", "size": 100},
                ],
            },
        ]
        git_rev_list = ["1", "2"]

        grouped_builds = group_build_sizes(builds, git_rev_list=git_rev_list)
        self.assertEqual(
            grouped_builds,
            [
                {
                    "name": ["lib.js"],
                    "type": "file",
                    "sizes": [
                        {"commit": "1", "size": 100},
                        {"commit": "2", "size": 100},
                    ],
                },
                {
                    "name": ["program.exe"],
                    "type": "exe",
                    "sizes": [
                        {"commit": "1", "size": None},
                        {"commit": "2", "size": 42},
                    ],
                },
            ],
        )

    def test_commit_with_no_build_has_no_entry(self) -> None:
        builds = [
            {
                "readme": {"Git-Commit": "1"},
                "sizes": [
                    {"name": ["lib.js"], "type": "file", "size": 100},
                ],
            },
            {
                "readme": {"Git-Commit": "3"},
                "sizes": [
                    {"name": ["lib.js"], "type": "file", "size": 100},
                ],
            },
        ]
        git_rev_list = ["0", "1", "2", "3", "4"]

        grouped_builds = group_build_sizes(builds, git_rev_list=git_rev_list)
        self.assertEqual(
            grouped_builds,
            [
                {
                    "name": ["lib.js"],
                    "type": "file",
                    "sizes": [
                        {"commit": "1", "size": 100},
                        {"commit": "3", "size": 100},
                    ],
                },
            ],
        )

    def test_builds_with_different_version_numbers_are_grouped_together(self) -> None:
        builds = [
            {
                "readme": {"Git-Commit": "2"},
                "sizes": [
                    {
                        "name": [
                            "npm/quick-lint-js-0.2.0.tgz",
                            "package/linux/bin/quick-lint-js",
                        ],
                        "type": "exe",
                        "size": 100,
                    },
                    {
                        "name": [
                            "npm/quick-lint-js-0.2.0.tgz",
                            "package/windows/bin/quick-lint-js.exe",
                        ],
                        "type": "exe",
                        "size": 150,
                    },
                    {
                        "name": ["debian/quick-lint-js_0.2.0-1_amd64.deb"],
                        "type": "file",
                        "size": 175,
                    },
                ],
            },
            {
                "readme": {"Git-Commit": "3"},
                "sizes": [
                    {
                        "name": [
                            "npm/quick-lint-js-0.3.0.tgz",
                            "package/linux/bin/quick-lint-js",
                        ],
                        "type": "exe",
                        "size": 200,
                    },
                    {
                        "name": [
                            "npm/quick-lint-js-0.3.0.tgz",
                            "package/windows/bin/quick-lint-js.exe",
                        ],
                        "type": "exe",
                        "size": 250,
                    },
                    {
                        "name": ["debian/quick-lint-js_0.3.0-1_amd64.deb"],
                        "type": "file",
                        "size": 275,
                    },
                ],
            },
        ]
        git_rev_list = ["2", "3"]

        grouped_builds = group_build_sizes(builds, git_rev_list=git_rev_list)
        self.assertEqual(
            grouped_builds,
            [
                {
                    "name": ["debian/quick-lint-js_*-1_amd64.deb"],
                    "type": "file",
                    "sizes": [
                        {"commit": "2", "size": 175},
                        {"commit": "3", "size": 275},
                    ],
                },
                {
                    "name": [
                        "npm/quick-lint-js-*.tgz",
                        "package/linux/bin/quick-lint-js",
                    ],
                    "type": "exe",
                    "sizes": [
                        {"commit": "2", "size": 100},
                        {"commit": "3", "size": 200},
                    ],
                },
                {
                    "name": [
                        "npm/quick-lint-js-*.tgz",
                        "package/windows/bin/quick-lint-js.exe",
                    ],
                    "type": "exe",
                    "sizes": [
                        {"commit": "2", "size": 150},
                        {"commit": "3", "size": 250},
                    ],
                },
            ],
        )


def group_build_sizes(
    builds: typing.List, git_rev_list: typing.List[str]
) -> typing.List:
    def builds_for_commit(commit: str):
        result = []
        for build in builds:
            readme = build.get("readme")
            if readme is None:
                continue
            if readme.get("Git-Commit") == commit:
                result.append(build)
        return result

    class SeriesKey(typing.NamedTuple):
        name: typing.Tuple[str, ...]
        type: str

    def series_key_for_sample(sample) -> SeriesKey:
        return SeriesKey(
            name=tuple(scrub_version_number(part) for part in sample["name"]),
            type=sample["type"],
        )

    def scrub_version_number(s: str) -> str:
        return re.sub(r"(^|(?<=\D))\d+\.\d+\.\d+(?=\D|$)", "*", s)

    all_series_keys = set()
    for build in builds:
        for sample in build["sizes"]:
            all_series_keys.add(series_key_for_sample(sample))

    series: typing.Mapping[SeriesKey, typing.List] = collections.defaultdict(list)

    for git_commit in git_rev_list:
        for build in builds_for_commit(git_commit):
            size_by_series_key = {
                series_key_for_sample(sample): sample["size"]
                for sample in build["sizes"]
            }
            for series_key in all_series_keys:
                series[series_key].append(
                    {
                        "commit": git_commit,
                        "size": size_by_series_key.get(series_key, None),
                    }
                )

    return sorted(
        [
            {
                "name": list(key.name),
                "type": key.type,
                "sizes": value,
            }
            for (key, value) in series.items()
        ],
        key=lambda series: series["name"],
    )


if __name__ == "__main__":
    main()

# quick-lint-js finds bugs in JavaScript programs.
# Copyright (C) 2020  Matthew "strager" Glazar
#
# This file is part of quick-lint-js.
#
# quick-lint-js is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# quick-lint-js is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with quick-lint-js.  If not, see <https://www.gnu.org/licenses/>.
