Petr Tsvetkov
WIP on annotated diffs generation
aab3281
raw
history blame
343 Bytes
import os
from pathlib import Path
def _ensure_dir(name: str) -> Path:
    """Return ``Path(name)``, creating that directory first if it is missing.

    The path is relative, so it is resolved against the current working
    directory at import time. Only the final component is created (no
    ``parents=True``); an already-existing directory is not an error.
    """
    directory = Path(name)
    directory.mkdir(exist_ok=True)
    return directory


# Value of the HF_TOKEN environment variable, or None when it is not set.
# NOTE(review): presumably a Hugging Face access token -- confirm with callers.
HF_TOKEN = os.getenv('HF_TOKEN')

# Name and split of the raw dataset.
# NOTE(review): looks like a Hugging Face Hub "<owner>/<dataset>" id -- confirm.
HF_RAW_DATASET_NAME = "petrtsv-jb/commit-msg-rewriting"
HF_RAW_DATASET_SPLIT = 'train'

# Working directories; both are created as a side effect of importing this
# module.
CACHE_DIR = _ensure_dir("cache")
OUTPUT_DIR = _ensure_dir("output")

# CSV artifact path inside OUTPUT_DIR (the file itself is not created here).
ANNOTATED_DIFFS_ARTIFACT = OUTPUT_DIR.joinpath("annotated_diffs.csv")