nlp-research / bilm-tf

bilm-tf for nlp-research
0 stars · 1 fork · source link

시스템4 성능 실험 #6

Open bart2001 opened 6 years ago

bart2001 commented 6 years ago

모델명: sejong_max_characters_per_token_4

options.json

{
 "all_clip_norm_val": 10.0,
 "batch_size": 128,
 "bidirectional": true,
 "char_cnn": {
  "activation": "relu",
  "embedding": {
   "dim": 16
  },
  "filters": [
   [
    1,
    32
   ],
   [
    2,
    32
   ],
   [
    3,
    64
   ],
   [
    4,
    128
   ]
  ],
  "max_characters_per_token": 4,
  "n_characters": 261,
  "n_highway": 2
 },
 "dropout": 0.1,
 "lstm": {
  "cell_clip": 3,
  "dim": 4096,
  "n_layers": 2,
  "proj_clip": 3,
  "projection_dim": 256,
  "use_skip_connections": true
 },
 "n_epochs": 10,
 "n_negative_samples_batch": 44,
 "n_tokens_vocab": 4488,
 "n_train_tokens": 32119740,
 "unroll_steps": 20
}

bart2001 commented 6 years ago

학습 중