diff --git a/languedoc.py b/src/languedoc/train.py copy from languedoc.py copy to src/languedoc/train.py --- a/languedoc.py +++ b/src/languedoc/train.py @@ -4,7 +4,7 @@ import itertools import json import gzip -from shared import preprocess, identify, extract_ngram_freqs, rank_ngram_freqs, Sample +from predict import preprocess, identify, extract_ngram_freqs, rank_ngram_freqs, Sample random.seed(19181028) @@ -72,9 +72,9 @@ def cross_validate(sample_sets): return score / max_score, (score, max_score) -DATA_DIR = os.path.join(os.path.dirname(__file__), "data") +DATA_DIR = os.path.join(os.path.dirname(__file__), "../../data") LANG_DIRS = sorted([x.path for x in os.scandir(DATA_DIR)]) -MODEL_PATH = os.path.join(os.path.dirname(__file__), "models.json.gz") +MODEL_PATH = os.path.join(os.path.dirname(__file__), "../../models.json.gz") if __name__ == "__main__": samples = []