context.pbtxt 4.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161
  # Parameters whose names start with 'brain_parser'.
  # embedding_dims, features and embedding_names below each hold three
  # ';'-separated entries. Presumably entry i of one corresponds to entry i of
  # the others (64 <-> *.word features <-> 'words', 32 <-> *.tag <-> 'tags',
  # 32 <-> *.label <-> 'labels') -- TODO confirm against the code that reads them.
  1. Parameter {
  2. name: 'brain_parser_embedding_dims'
  3. value: '64;32;32'
  4. }
  # Feature list: three ';'-separated groups. Within a group the features are
  # space-separated; group 1 entries all end in '.word', group 2 in '.tag',
  # group 3 in '.label'.
  5. Parameter {
  6. name: 'brain_parser_features'
  7. value: 'input.word input(1).word input(2).word input(3).word stack.word stack(1).word stack(2).word stack(3).word stack.child(1).word stack.child(1).sibling(-1).word stack.child(-1).word stack.child(-1).sibling(1).word stack(1).child(1).word stack(1).child(1).sibling(-1).word stack(1).child(-1).word stack(1).child(-1).sibling(1).word stack.child(2).word stack.child(-2).word stack(1).child(2).word stack(1).child(-2).word;input.tag input(1).tag input(2).tag input(3).tag stack.tag stack(1).tag stack(2).tag stack(3).tag stack.child(1).tag stack.child(1).sibling(-1).tag stack.child(-1).tag stack.child(-1).sibling(1).tag stack(1).child(1).tag stack(1).child(1).sibling(-1).tag stack(1).child(-1).tag stack(1).child(-1).sibling(1).tag stack.child(2).tag stack.child(-2).tag stack(1).child(2).tag stack(1).child(-2).tag;stack.child(1).label stack.child(1).sibling(-1).label stack.child(-1).label stack.child(-1).sibling(1).label stack(1).child(1).label stack(1).child(1).sibling(-1).label stack(1).child(-1).label stack(1).child(-1).sibling(1).label stack.child(2).label stack.child(-2).label stack(1).child(2).label stack(1).child(-2).label'
  8. }
  # One name per feature group above (three names, three groups).
  9. Parameter {
  10. name: 'brain_parser_embedding_names'
  11. value: 'words;tags;labels'
  12. }
  # NOTE(review): the meaning of 'default' is not visible in this file; check
  # the consumer of 'brain_parser_scoring' before changing it.
  13. Parameter {
  14. name: 'brain_parser_scoring'
  15. value: 'default'
  16. }
  # Parameters whose names start with 'brain_pos'.
  # Unlike the 'brain_parser' parameters, a transition system is named
  # explicitly here ('tagger').
  17. Parameter {
  18. name: 'brain_pos_transition_system'
  19. value: 'tagger'
  20. }
  # embedding_dims, features and embedding_names below each hold four
  # ';'-separated entries. Presumably entry i of one corresponds to entry i of
  # the others -- TODO confirm against the code that reads them.
  21. Parameter {
  22. name: 'brain_pos_embedding_dims'
  23. value: '64;4;8;8'
  24. }
  # Feature list: four ';'-separated groups, in order:
  #   1. '.word' features over stack(3)..stack and input..input(3)
  #   2. input.digit and input.hyphen
  #   3. suffix(length=2) features on stack, input, input(1)
  #   4. prefix(length=2) features on stack, input, input(1)
  25. Parameter {
  26. name: 'brain_pos_features'
  27. value: 'stack(3).word stack(2).word stack(1).word stack.word input.word input(1).word input(2).word input(3).word;input.digit input.hyphen;stack.suffix(length=2) input.suffix(length=2) input(1).suffix(length=2);stack.prefix(length=2) input.prefix(length=2) input(1).prefix(length=2)'
  28. }
  # One name per feature group above (four names, four groups).
  29. Parameter {
  30. name: 'brain_pos_embedding_names'
  31. value: 'words;other;suffix;prefix'
  32. }
  # Corpus inputs backed by files. All three use record_format
  # 'conll-sentence' and a single Part with a file_pattern.
  # '<your-dataset>' in each file_pattern is a placeholder and must be replaced
  # with a real path before this file is used.
  33. input {
  34. name: 'training-corpus'
  35. record_format: 'conll-sentence'
  36. Part {
  37. file_pattern: '<your-dataset>/treebank-train.trees.conll'
  38. }
  39. }
  # NOTE(review): 'tuning-corpus' reads dev.conll, while 'dev-corpus' below
  # reads test.conll. The input names and file names are offset by one; confirm
  # this mapping is intended before pointing these at real data.
  40. input {
  41. name: 'tuning-corpus'
  42. record_format: 'conll-sentence'
  43. Part {
  44. file_pattern: '<your-dataset>/dev.conll'
  45. }
  46. }
  47. input {
  48. name: 'dev-corpus'
  49. record_format: 'conll-sentence'
  50. Part {
  51. file_pattern: '<your-dataset>/test.conll'
  52. }
  53. }
  # Inputs tagged with creator 'brain_pos/greedy'. None of them declares a
  # Part/file_pattern in this file; presumably their locations are resolved
  # elsewhere from the creator name -- TODO confirm.
  #
  # Tagged corpora: one per corpus split (training / tuning / dev), all in
  # 'conll-sentence' record format.
  54. input {
  55. name: 'tagged-training-corpus'
  56. creator: 'brain_pos/greedy'
  57. record_format: 'conll-sentence'
  58. }
  59. input {
  60. name: 'tagged-tuning-corpus'
  61. creator: 'brain_pos/greedy'
  62. record_format: 'conll-sentence'
  63. }
  64. input {
  65. name: 'tagged-dev-corpus'
  66. creator: 'brain_pos/greedy'
  67. record_format: 'conll-sentence'
  68. }
  # Maps and tables: these entries declare only a name and a creator (no
  # record_format, no Part).
  69. input {
  70. name: 'label-map'
  71. creator: 'brain_pos/greedy'
  72. }
  73. input {
  74. name: 'word-map'
  75. creator: 'brain_pos/greedy'
  76. }
  77. input {
  78. name: 'lcword-map'
  79. creator: 'brain_pos/greedy'
  80. }
  81. input {
  82. name: 'tag-map'
  83. creator: 'brain_pos/greedy'
  84. }
  85. input {
  86. name: 'category-map'
  87. creator: 'brain_pos/greedy'
  88. }
  89. input {
  90. name: 'char-map'
  91. creator: 'brain_pos/greedy'
  92. }
  93. input {
  94. name: 'prefix-table'
  95. creator: 'brain_pos/greedy'
  96. }
  97. input {
  98. name: 'suffix-table'
  99. creator: 'brain_pos/greedy'
  100. }
  101. input {
  102. name: 'tag-to-category'
  103. creator: 'brain_pos/greedy'
  104. }
  # Inputs tagged with a 'brain_parser/...' creator. All use record_format
  # 'conll-sentence' and none declares a Part/file_pattern in this file.
  #
  # creator 'brain_parser/greedy': the projectivized training corpus plus one
  # parsed corpus per split (training / tuning / dev).
  105. input {
  106. name: 'projectivized-training-corpus'
  107. creator: 'brain_parser/greedy'
  108. record_format: 'conll-sentence'
  109. }
  110. input {
  111. name: 'parsed-training-corpus'
  112. creator: 'brain_parser/greedy'
  113. record_format: 'conll-sentence'
  114. }
  115. input {
  116. name: 'parsed-tuning-corpus'
  117. creator: 'brain_parser/greedy'
  118. record_format: 'conll-sentence'
  119. }
  120. input {
  121. name: 'parsed-dev-corpus'
  122. creator: 'brain_parser/greedy'
  123. record_format: 'conll-sentence'
  124. }
  # creator 'brain_parser/structured': one 'beam-parsed-*' corpus per split
  # (training / tuning / dev).
  125. input {
  126. name: 'beam-parsed-training-corpus'
  127. creator: 'brain_parser/structured'
  128. record_format: 'conll-sentence'
  129. }
  130. input {
  131. name: 'beam-parsed-tuning-corpus'
  132. creator: 'brain_parser/structured'
  133. record_format: 'conll-sentence'
  134. }
  135. input {
  136. name: 'beam-parsed-dev-corpus'
  137. creator: 'brain_parser/structured'
  138. record_format: 'conll-sentence'
  139. }
  # Stream-style entries: each has a single Part whose file_pattern is '-'.
  # Presumably '-' denotes the process's standard input/output rather than a
  # file on disk -- TODO confirm with the reader/writer implementation.
  #
  # 'stdin' is the only entry in this file with record_format 'english-text'.
  140. input {
  141. name: 'stdin'
  142. record_format: 'english-text'
  143. Part {
  144. file_pattern: '-'
  145. }
  146. }
  147. input {
  148. name: 'stdin-conll'
  149. record_format: 'conll-sentence'
  150. Part {
  151. file_pattern: '-'
  152. }
  153. }
  # Note: 'stdout-conll' is declared with the same 'input' message as every
  # other entry in this file, despite naming an output stream.
  154. input {
  155. name: 'stdout-conll'
  156. record_format: 'conll-sentence'
  157. Part {
  158. file_pattern: '-'
  159. }
  160. }