From 548ee210df79e9c74949b20be959a9fa418c1017 Mon Sep 17 00:00:00 2001
From: Andrej Karpathy
Date: Sun, 21 Nov 2021 13:46:14 -0800
Subject: [PATCH] better default parameters, based on qualitative inspection of tfidf features and word vectors

---
 compute.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/compute.py b/compute.py
index 5460455..a583c0b 100644
--- a/compute.py
+++ b/compute.py
@@ -17,9 +17,9 @@ from aslite.db import get_papers_db
 if __name__ == '__main__':
 
     parser = argparse.ArgumentParser(description='Arxiv Computor')
-    parser.add_argument('-n', '--num', type=int, default=10000, help='number of tfidf features')
+    parser.add_argument('-n', '--num', type=int, default=20000, help='number of tfidf features')
     parser.add_argument('--min_df', type=int, default=5, help='min df')
-    parser.add_argument('--max_df', type=float, default=0.5, help='max df')
+    parser.add_argument('--max_df', type=float, default=0.1, help='max df')
     args = parser.parse_args()
     print(args)
 