Add pre-process invoke task & rename data source files
This commit is contained in:
parent
2cc87d878f
commit
b2bc5e0d1c
4 changed files with 22 additions and 3 deletions
Can't render this file because it is too large.
|
25
tasks.py
25
tasks.py
|
@ -1,3 +1,4 @@
|
||||||
|
import re
|
||||||
from concurrent.futures import ThreadPoolExecutor
|
from concurrent.futures import ThreadPoolExecutor
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
|
|
||||||
|
@ -17,6 +18,7 @@ TARGETS = [
|
||||||
"windows/amd64",
|
"windows/amd64",
|
||||||
"windows/arm",
|
"windows/arm",
|
||||||
]
|
]
|
||||||
|
# Absolute path of the directory containing this file; the tasks below build
# their "dist" and "data/raw_data" paths from it. resolve(strict=True) raises
# if the path does not exist.
BASE_DIR = Path(__file__).parent.resolve(strict=True)
|
||||||
|
|
||||||
|
|
||||||
@task
|
@task
|
||||||
|
@ -36,12 +38,29 @@ def build(context, version_name):
|
||||||
binary_name = f"insee-{version_name}-{os}-{arch}"
|
binary_name = f"insee-{version_name}-{os}-{arch}"
|
||||||
if os == "windows":
|
if os == "windows":
|
||||||
binary_name += ".exe"
|
binary_name += ".exe"
|
||||||
binary_path = (
|
binary_path = BASE_DIR / "dist" / binary_name
|
||||||
Path(__file__).resolve(strict=True).parent / "dist" / binary_name
|
|
||||||
)
|
|
||||||
pool.submit(
|
pool.submit(
|
||||||
context.run,
|
context.run,
|
||||||
f"go build -o {binary_path}",
|
f"go build -o {binary_path}",
|
||||||
env={"GOOS": os, "GOARCH": arch},
|
env={"GOOS": os, "GOARCH": arch},
|
||||||
echo=True,
|
echo=True,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
@task
def pre_process(context):
    """Pre-process raw data into JSON.

    First normalises the names of the raw CSV files found in
    ``data/raw_data`` (for example ``commune2020.csv`` becomes
    ``commune.csv``), then runs the Go program in ``./pre_process`` from the
    repository root.

    Args:
        context: Invoke context used to change directory and run the command.
    """
    # Compile each pattern once, up front, instead of once per directory entry.
    files_to_rename = {
        re.compile(r"commune.*\.csv"): "commune.csv",
        re.compile(r"departement.*\.csv"): "departement.csv",
        re.compile(r"pays.*\.csv"): "pays.csv",
    }
    raw_data_dir = BASE_DIR / "data" / "raw_data"

    # Snapshot the listing before renaming anything: what iterdir() yields
    # when entries are added or removed during iteration is unspecified.
    # Sorting makes the processing order deterministic.
    for file in sorted(raw_data_dir.iterdir()):
        for pattern, target_name in files_to_rename.items():
            # fullmatch() so that only names really ending in ".csv" qualify
            # (match() would also accept e.g. "commune.csv.bak").
            if not pattern.fullmatch(file.name):
                continue
            # Nothing to do when the file already has its canonical name.
            if file.name != target_name:
                file.rename(raw_data_dir / target_name)
            # The file is handled (and may no longer exist under its old
            # name), so do not test it against the remaining patterns.
            break

    with context.cd(BASE_DIR):
        context.run("go run ./pre_process")
|
||||||
|
|
Loading…
Reference in a new issue