Merge branch 'main' into dev/mldb (292aa183) · Commits · git-mirror / Imgutils

.github/workflows/doc.yml

+83 −0

Original line number	Diff line number	Diff line
		@@ -10,8 +10,77 @@ on:
		types: [ published ]

		jobs:
		# Job: regenerate the documentation contents and push the result back to
		# the ref that triggered the workflow. Skipped when the head commit message
		# contains 'ci skip'.
		contents:
		  runs-on: ubuntu-latest
		  if: "!contains(github.event.head_commit.message, 'ci skip')"
		  strategy:
		    matrix:
		      # Quoted so the version is never read as a float.
		      python-version: [ '3.7' ]

		  services:
		    # PlantUML server reachable from the steps at http://localhost:18080
		    plantuml:
		      image: plantuml/plantuml-server
		      ports:
		        - '18080:8080'

		  steps:
		    - name: Set Swap Space
		      uses: pierotofy/set-swap-space@master
		      with:
		        swap-size-gb: 8
		    - name: Checkout code
		      uses: actions/checkout@v2
		      with:
		        fetch-depth: 20
		        submodules: 'recursive'
		    - name: Set up Python ${{ matrix.python-version }}
		      uses: actions/setup-python@v2
		      with:
		        python-version: ${{ matrix.python-version }}
		    - name: Install dependencies
		      run: |
		        sudo apt-get update -y
		        sudo apt-get install -y make wget curl cloc graphviz pandoc
		        dot -V
		        python -m pip install -r requirements.txt
		        python -m pip install -r requirements-doc.txt
		    # `make dataset` is retried up to 5 times, 20 minutes per attempt.
		    - name: Prepare dataset
		      uses: nick-fields/retry@v2
		      env:
		        CI: 'true'
		        HF_NARUGO_USERNAME: ${{ secrets.HF_NARUGO_USERNAME }}
		        HF_NARUGO_PASSWORD: ${{ secrets.HF_NARUGO_PASSWORD }}
		      with:
		        shell: bash
		        timeout_minutes: 20
		        max_attempts: 5
		        retry_on: any
		        command: |
		          make dataset
		    - name: Generate the contents
		      env:
		        ENV_PROD: 'true'
		        PLANTUML_HOST: http://localhost:18080
		      run: |
		        plantumlcli -c
		        make docs
		    # Commit only when the working tree differs from HEAD; otherwise
		    # `git diff-index --quiet` succeeds and the commit is skipped.
		    - name: Change Commit
		      id: commit
		      run: |
		        git config user.name 'narugo1992'
		        git config user.email 'narugo@126.com'
		        git add -A
		        git diff-index --quiet HEAD || git commit -a -m "dev(narugo): auto sync $(date -R)"
		    - name: Push changes
		      uses: ad-m/github-push-action@master
		      with:
		        github_token: ${{ secrets.GITHUB_TOKEN }}
		        branch: ${{ github.ref }}

		doc:
		runs-on: ubuntu-latest
		needs:
		- contents
		if: "!contains(github.event.head_commit.message, 'ci skip')"
		strategy:
		matrix:
		@@ -44,11 +113,25 @@ jobs:
		dot -V
		python -m pip install -r requirements.txt
		python -m pip install -r requirements-doc.txt
		# `make dataset` is retried up to 5 times, 20 minutes per attempt.
		- name: Prepare dataset
		  uses: nick-fields/retry@v2
		  env:
		    CI: 'true'
		    HF_NARUGO_USERNAME: ${{ secrets.HF_NARUGO_USERNAME }}
		    HF_NARUGO_PASSWORD: ${{ secrets.HF_NARUGO_PASSWORD }}
		  with:
		    shell: bash
		    timeout_minutes: 20
		    max_attempts: 5
		    retry_on: any
		    command: |
		      make dataset
		- name: Generate
		env:
		ENV_PROD: 'true'
		PLANTUML_HOST: http://localhost:18080
		run: \|
		git pull
		git fetch --all --tags
		git branch -av
		git remote -v

.gitignore

+1 −0

Original line number	Diff line number	Diff line
		@@ -1205,6 +1205,7 @@ fabric.properties
		/docs/source/**/*.sh.err
		/docs/source/**/*.sh.exitcode
		/docs/source/**/*.dat.*
		!/docs/source/**/*.benchmark.py.*
		!/docs/source/_static/**/*
		/docs/source/**/*.result.ipynb
		/cartpole_dqn_*

docs/Makefile

+6 −1

Original line number	Diff line number	Diff line
		@@ -11,6 +11,8 @@ BUILDDIR ?= ${PROJ_DIR}/build
		# Helper makefile that drives the per-source build, and the command used
		# to invoke it with SOURCE pointing at the documentation source tree.
		ALL_MK := ${SOURCEDIR}/all.mk
		ALL := $(MAKE) -f "${ALL_MK}" SOURCE=${SOURCEDIR}

		# Files under the source tree named like benchmark_<name>.dat.<ext>.
		# The wildcards are required: without them `find -name` only matches a
		# file literally called 'benchmark_.dat.'.
		BMS := $(shell find ${SOURCEDIR} -name 'benchmark_*.dat.*')

		# Export every make variable to the environment of recipes and sub-makes.
		.EXPORT_ALL_VARIABLES:

		# NOTE(review): presumably tells the build to skip content generation;
		# confirm against the consumer of this variable.
		NO_CONTENTS_BUILD = true
		@@ -42,3 +44,6 @@ sourcedir:
		@echo $(shell readlink -f ${SOURCEDIR})
		# Print the resolved absolute path (readlink -f) of ${BUILDDIR}/html.
		builddir:
		@echo $(shell readlink -f ${BUILDDIR}/html)

		# Delegate to the `cleanbm` target of all.mk (presumably removes generated
		# benchmark artifacts; confirm in all.mk). Declared phony so that a file
		# named `cleanbm` can never make this target look up to date.
		.PHONY: cleanbm
		cleanbm:
			$(ALL) cleanbm

docs/source/_libs/benchmark.py

0 → 100644

+158 −0

Original line number	Diff line number	Diff line
		import glob
		import multiprocessing
		import os
		import time
		import warnings
		from multiprocessing import Process
		from typing import Tuple, List

		import click
		import matplotlib.pyplot as plt
		import numpy as np
		import psutil
		from hbutils.scale import size_to_bytes_str
		from hbutils.string import ordinalize, plural_word
		from matplotlib.ticker import FuncFormatter
		from tqdm.auto import tqdm

		from conf import PROJ_DIR
		from plot import INCHES_TO_PIXELS

		# Every *.jpg file found at any depth below <PROJ_DIR>/test/testfile/dataset.
		# The '**' segment is what makes ``recursive=True`` descend into nested
		# directories; without it the flag has no effect.
		_DEFAULT_IMAGE_POOL = glob.glob(
		    os.path.join(PROJ_DIR, 'test', 'testfile', 'dataset', '**', '*.jpg'),
		    recursive=True,
		)


		class BaseBenchmark:
		    """
		    Base class for memory / time benchmarks.

		    Subclasses implement :meth:`load`, :meth:`unload` and :meth:`run`. The
		    benchmark then records the resident memory of the current process and the
		    wall-clock time around each of these steps.
		    """

		    def __init__(self):
		        # Image paths that subclasses can use as benchmark input.
		        self.all_images = _DEFAULT_IMAGE_POOL

		    def load(self):
		        """Prepare whatever :meth:`run` needs. Must be overridden."""
		        raise NotImplementedError

		    def unload(self):
		        """Release what :meth:`load` prepared. Must be overridden."""
		        raise NotImplementedError

		    def run(self):
		        """Execute one benchmarked operation. Must be overridden."""
		        raise NotImplementedError

		    def run_benchmark(self, run_times):
		        """
		        Run one benchmark pass in the current process.

		        :param run_times: Number of times :meth:`run` is called.
		        :return: A tuple ``(mems, times, labels)`` of equally long arrays, one
		            entry per recorded step (``<init>``, ``<load>``, ``#1`` ... ``#N``,
		            ``<unload>``). ``mems`` is the RSS relative to the ``<init>`` step,
		            ``times`` is the time in seconds elapsed since the previous step
		            (``0`` for ``<init>``).
		        """
		        logs = []
		        current_process = psutil.Process()

		        def _record(name):
		            logs.append((name, current_process.memory_info().rss, time.time()))

		        # make sure the model is downloaded
		        self.load()
		        self.unload()

		        _record('<init>')

		        self.load()
		        _record('<load>')

		        for i in tqdm(range(run_times)):
		            self.run()
		            _record(f'#{i + 1}')

		        self.unload()
		        _record('<unload>')

		        mems = np.array([mem for _, mem, _ in logs])
		        mems -= mems[0]
		        times = np.array([time_ for _, _, time_ in logs])
		        times -= times[0]
		        # Turn timestamps into per-step durations; the right-hand side is
		        # evaluated completely before the assignment happens.
		        times[1:] = times[1:] - times[:-1]
		        labels = np.array([name for name, _, _ in logs])

		        return mems, times, labels

		    def _run_in_subprocess_share(self, run_times, ret):
		        # Subprocess entry point: hand the result back through the shared dict.
		        ret['retval'] = self.run_benchmark(run_times)

		    def run_in_subprocess(self, run_times: int = 10, try_times: int = 10):
		        """
		        Repeat :meth:`run_benchmark` in fresh subprocesses and average the results.

		        :param run_times: Number of :meth:`run` calls per try.
		        :param try_times: Number of subprocesses to run, one after another.
		        :return: A tuple ``(final_mems, final_times, final_labels)``: the
		            cumulative sum of the mean per-step memory deltas (starting at 0),
		            the mean per-step times, and the labels of the first try.
		        :raises ChildProcessError: If a subprocess exits with a non-zero code.
		        """
		        full_deltas, full_times, final_labels = [], [], None
		        # The manager owns a server process; the context manager shuts it
		        # down even when a try fails.
		        with multiprocessing.Manager() as manager:
		            for i in tqdm(range(try_times)):
		                ret = manager.dict()
		                p = Process(target=self._run_in_subprocess_share, args=(run_times, ret,))
		                p.start()
		                p.join()
		                if p.exitcode != 0:
		                    raise ChildProcessError(f'Exitcode {p.exitcode} in {self!r}\'s {ordinalize(i + 1)} try.')

		                # Must be read while the manager is still alive.
		                mems, times, labels = ret['retval']
		                deltas = mems[1:] - mems[:-1]
		                full_deltas.append(deltas)
		                full_times.append(times)
		                if final_labels is None:
		                    final_labels = labels

		        deltas = np.stack(full_deltas).mean(axis=0)
		        final_mems = np.cumsum([0, *deltas])
		        final_times = np.stack(full_times).mean(axis=0)

		        return final_mems, final_times, final_labels


		def create_plot_cli(items: List[Tuple[str, BaseBenchmark]],
		                    title: str = 'Unnamed Benchmark Plot', run_times=15, try_times=10,
		                    mem_ylog: bool = False, time_ylog: bool = False,
		                    figsize=(720, 420), dpi: int = 300):
		    """
		    Build a click command that runs the given benchmarks and saves a plot.

		    :param items: ``(name, benchmark)`` pairs; each becomes one line per chart.
		    :param title: First line of the figure title.
		    :param run_times: Passed to ``run_in_subprocess`` as ``run_times``.
		    :param try_times: Passed to ``run_in_subprocess`` as ``try_times``.
		    :param mem_ylog: Use a logarithmic y axis for the memory chart.
		    :param time_ylog: Use a logarithmic y axis for the time chart.
		    :param figsize: Figure size, divided by ``INCHES_TO_PIXELS`` before being
		        handed to matplotlib (presumably given in pixels).
		    :param dpi: Resolution used when saving the figure.
		    :return: A click command with a required ``--output`` / ``-o`` option.
		    """

		    def fmt_size(x, pos):
		        _ = pos
		        # Suppress warnings from the size formatting only, instead of
		        # silencing every warning in the process from the first tick on.
		        with warnings.catch_warnings():
		            warnings.simplefilter('ignore')
		            return size_to_bytes_str(x, precision=1)

		    def fmt_time(x, pos):
		        _ = pos
		        # Pick the unit from the magnitude so that negative tick values are
		        # not all rendered in nanoseconds.
		        magnitude = abs(x)
		        if magnitude < 1e-6:
		            return f'{x * 1e9:.1f}ns'
		        elif magnitude < 1e-3:
		            return f'{x * 1e6:.1f}μs'
		        elif magnitude < 1:
		            return f'{x * 1e3:.1f}ms'
		        else:
		            return f'{x * 1.0:.1f}s'

		    @click.command()
		    @click.option('--output', '-o', 'save_as', type=click.Path(dir_okay=False), required=True,
		                  help='Output path of image file.', show_default=True)
		    def _execute(save_as):
		        fig, axes = plt.subplots(1, 2, figsize=(figsize[0] / INCHES_TO_PIXELS, figsize[1] / INCHES_TO_PIXELS))

		        # Left chart: memory usage.
		        if mem_ylog:
		            axes[0].set_yscale('log')
		        axes[0].yaxis.set_major_formatter(FuncFormatter(fmt_size))
		        axes[0].set_title('Memory Benchmark')
		        axes[0].set_ylabel('Memory Usage')

		        # Right chart: time cost.
		        if time_ylog:
		            axes[1].set_yscale('log')
		        axes[1].yaxis.set_major_formatter(FuncFormatter(fmt_time))
		        axes[1].set_title('Performance Benchmark (CPU)')
		        axes[1].set_ylabel('Time Cost')

		        labeled = False

		        for name, bm in tqdm(items):
		            mems, times, labels = bm.run_in_subprocess(run_times, try_times)
		            axes[0].plot(mems, label=name)
		            axes[1].plot(times, label=name)
		            # The x tick labels are taken from the first benchmark only.
		            if not labeled:
		                axes[0].set_xticks(range(len(labels)), labels, rotation='vertical')
		                axes[1].set_xticks(range(len(labels)), labels, rotation='vertical')
		                labeled = True

		        axes[0].legend()
		        axes[0].grid()
		        axes[1].legend()
		        axes[1].grid()

		        fig.suptitle(f'{title}\n'
		                     f'(Mean of {plural_word(try_times, "try")}, '
		                     f'run for {plural_word(run_times, "time")})')

		        fig.tight_layout()
		        try:
		            # Save this figure explicitly rather than whichever one pyplot
		            # currently considers active.
		            fig.savefig(save_as, bbox_inches='tight', dpi=dpi, transparent=True)
		        finally:
		            plt.close(fig)

		    return _execute

docs/source/_libs/conf.py

0 → 100644

+3 −0

Original line number	Diff line number	Diff line
		import os

		# Parent directory of the path given in the PROJ_DIR environment variable.
		# Indexing os.environ makes a missing variable fail with a KeyError naming
		# it, instead of an opaque TypeError from os.path.join(None, ...).
		PROJ_DIR = os.path.normpath(os.path.join(os.environ['PROJ_DIR'], '..'))

Original line number	Diff line number	Diff line
		@@ -1205,6 +1205,7 @@ fabric.properties
		/docs/source/**/*.sh.err
		/docs/source/**/*.sh.exitcode
		/docs/source/**/*.dat.*
		!/docs/source/**/*.benchmark.py.*
		!/docs/source/_static/**/*
		/docs/source/**/*.result.ipynb
		/cartpole_dqn_*