You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

hparams.py 3.0 kB

4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263
  1. import argparse
  2. class Hparams:
  3. parser = argparse.ArgumentParser()
  4. # prepro
  5. parser.add_argument('--vocab_size', default=32000, type=int)
  6. # train
  7. # files
  8. parser.add_argument('--train1', default='iwslt2016/segmented/train.de.bpe',
  9. help="german training segmented data")
  10. parser.add_argument('--train2', default='iwslt2016/segmented/train.en.bpe',
  11. help="english training segmented data")
  12. parser.add_argument('--eval1', default='iwslt2016/segmented/eval.de.bpe',
  13. help="german evaluation segmented data")
  14. parser.add_argument('--eval2', default='iwslt2016/segmented/eval.en.bpe',
  15. help="english evaluation segmented data")
  16. parser.add_argument('--eval3', default='iwslt2016/prepro/eval.en',
  17. help="english evaluation unsegmented data")
  18. # vocabulary
  19. parser.add_argument('--vocab', default='iwslt2016/segmented/bpe.vocab',
  20. help="vocabulary file path")
  21. # training scheme
  22. parser.add_argument('--batch_size', default=16, type=int)
  23. parser.add_argument('--eval_batch_size', default=128, type=int)
  24. parser.add_argument('--lr', default=0.0003,
  25. type=float, help="learning rate")
  26. parser.add_argument('--warmup_steps', default=4000, type=int)
  27. parser.add_argument('--logdir', default="logs/tf", help="log directory")
  28. parser.add_argument('--num_epochs', default=20, type=int)
  29. parser.add_argument('--evaldir', default="logs/tf/eval",
  30. help="evaluation dir")
  31. # model
  32. parser.add_argument('--d_model', default=512, type=int,
  33. help="hidden dimension of encoder/decoder")
  34. parser.add_argument('--d_ff', default=2048, type=int,
  35. help="hidden dimension of feedforward layer")
  36. parser.add_argument('--num_blocks', default=6, type=int,
  37. help="number of encoder/decoder blocks")
  38. parser.add_argument('--num_heads', default=8, type=int,
  39. help="number of attention heads")
  40. parser.add_argument('--maxlen1', default=100, type=int,
  41. help="maximum length of a source sequence")
  42. parser.add_argument('--maxlen2', default=100, type=int,
  43. help="maximum length of a target sequence")
  44. parser.add_argument('--dropout_rate', default=0.3, type=float)
  45. parser.add_argument('--smoothing', default=0.1, type=float,
  46. help="label smoothing rate")
  47. # test
  48. parser.add_argument('--test1', default='iwslt2016/segmented/test.de.bpe',
  49. help="german test segmented data")
  50. parser.add_argument('--test2', default='iwslt2016/prepro/test.en',
  51. help="english test data")
  52. parser.add_argument('--ckpt', help="checkpoint file path")
  53. parser.add_argument('--test_batch_size', default=128, type=int)
  54. parser.add_argument('--testdir', default="test/1", help="test result dir")