context.pbtxt 4.2 KB

  1. Parameter {
  2. name: 'brain_parser_embedding_dims'
  3. value: '64;32;32'
  4. }
  5. Parameter {
  6. name: 'brain_parser_features'
  7. value: 'input.word input(1).word input(2).word input(3).word stack.word stack(1).word stack(2).word stack(3).word stack.child(1).word stack.child(1).sibling(-1).word stack.child(-1).word stack.child(-1).sibling(1).word stack(1).child(1).word stack(1).child(1).sibling(-1).word stack(1).child(-1).word stack(1).child(-1).sibling(1).word stack.child(2).word stack.child(-2).word stack(1).child(2).word stack(1).child(-2).word;input.tag input(1).tag input(2).tag input(3).tag stack.tag stack(1).tag stack(2).tag stack(3).tag stack.child(1).tag stack.child(1).sibling(-1).tag stack.child(-1).tag stack.child(-1).sibling(1).tag stack(1).child(1).tag stack(1).child(1).sibling(-1).tag stack(1).child(-1).tag stack(1).child(-1).sibling(1).tag stack.child(2).tag stack.child(-2).tag stack(1).child(2).tag stack(1).child(-2).tag;stack.child(1).label stack.child(1).sibling(-1).label stack.child(-1).label stack.child(-1).sibling(1).label stack(1).child(1).label stack(1).child(1).sibling(-1).label stack(1).child(-1).label stack(1).child(-1).sibling(1).label stack.child(2).label stack.child(-2).label stack(1).child(2).label stack(1).child(-2).label'
  8. }
  9. Parameter {
  10. name: 'brain_parser_embedding_names'
  11. value: 'words;tags;labels'
  12. }
  13. Parameter {
  14. name: 'brain_parser_scoring'
  15. value: 'default'
  16. }
  17. Parameter {
  18. name: 'brain_pos_transition_system'
  19. value: 'tagger'
  20. }
  21. Parameter {
  22. name: 'brain_pos_embedding_dims'
  23. value: '64;4;8;8'
  24. }
  25. Parameter {
  26. name: 'brain_pos_features'
  27. value: 'stack(3).word stack(2).word stack(1).word stack.word input.word input(1).word input(2).word input(3).word;input.digit input.hyphen;stack.suffix(length=2) input.suffix(length=2) input(1).suffix(length=2);stack.prefix(length=2) input.prefix(length=2) input(1).prefix(length=2)'
  28. }
  29. Parameter {
  30. name: 'brain_pos_embedding_names'
  31. value: 'words;other;suffix;prefix'
  32. }
  33. input {
  34. name: 'training-corpus'
  35. record_format: 'conll-sentence'
  36. Part {
  37. file_pattern: '<your-dataset>/treebank-train.trees.conll'
  38. }
  39. }
  40. input {
  41. name: 'tuning-corpus'
  42. record_format: 'conll-sentence'
  43. Part {
  44. file_pattern: '<your-dataset>/dev.conll'
  45. }
  46. }
  47. input {
  48. name: 'dev-corpus'
  49. record_format: 'conll-sentence'
  50. Part {
  51. file_pattern: '<your-dataset>/test.conll'
  52. }
  53. }
  54. input {
  55. name: 'tagged-training-corpus'
  56. creator: 'brain_pos/greedy'
  57. record_format: 'conll-sentence'
  58. }
  59. input {
  60. name: 'tagged-tuning-corpus'
  61. creator: 'brain_pos/greedy'
  62. record_format: 'conll-sentence'
  63. }
  64. input {
  65. name: 'tagged-dev-corpus'
  66. creator: 'brain_pos/greedy'
  67. record_format: 'conll-sentence'
  68. }
  69. input {
  70. name: 'label-map'
  71. creator: 'brain_pos/greedy'
  72. }
  73. input {
  74. name: 'word-map'
  75. creator: 'brain_pos/greedy'
  76. }
  77. input {
  78. name: 'lcword-map'
  79. creator: 'brain_pos/greedy'
  80. }
  81. input {
  82. name: 'tag-map'
  83. creator: 'brain_pos/greedy'
  84. }
  85. input {
  86. name: 'category-map'
  87. creator: 'brain_pos/greedy'
  88. }
  89. input {
  90. name: 'prefix-table'
  91. creator: 'brain_pos/greedy'
  92. }
  93. input {
  94. name: 'suffix-table'
  95. creator: 'brain_pos/greedy'
  96. }
  97. input {
  98. name: 'tag-to-category'
  99. creator: 'brain_pos/greedy'
  100. }
  101. input {
  102. name: 'projectivized-training-corpus'
  103. creator: 'brain_parser/greedy'
  104. record_format: 'conll-sentence'
  105. }
  106. input {
  107. name: 'parsed-training-corpus'
  108. creator: 'brain_parser/greedy'
  109. record_format: 'conll-sentence'
  110. }
  111. input {
  112. name: 'parsed-tuning-corpus'
  113. creator: 'brain_parser/greedy'
  114. record_format: 'conll-sentence'
  115. }
  116. input {
  117. name: 'parsed-dev-corpus'
  118. creator: 'brain_parser/greedy'
  119. record_format: 'conll-sentence'
  120. }
  121. input {
  122. name: 'beam-parsed-training-corpus'
  123. creator: 'brain_parser/structured'
  124. record_format: 'conll-sentence'
  125. }
  126. input {
  127. name: 'beam-parsed-tuning-corpus'
  128. creator: 'brain_parser/structured'
  129. record_format: 'conll-sentence'
  130. }
  131. input {
  132. name: 'beam-parsed-dev-corpus'
  133. creator: 'brain_parser/structured'
  134. record_format: 'conll-sentence'
  135. }
  136. input {
  137. name: 'stdin'
  138. record_format: 'english-text'
  139. Part {
  140. file_pattern: '-'
  141. }
  142. }
  143. input {
  144. name: 'stdin-conll'
  145. record_format: 'conll-sentence'
  146. Part {
  147. file_pattern: '-'
  148. }
  149. }
  150. input {
  151. name: 'stdout-conll'
  152. record_format: 'conll-sentence'
  153. Part {
  154. file_pattern: '-'
  155. }
  156. }