---
# config-prompt.yaml
#
# Settings for generating needle-in-a-haystack retrieval prompts: the needle
# sentence and question, the context-length sweep, the document-depth sweep,
# the tokenizer, and the output directory.
#
# NOTE(review): the nesting below was reconstructed from a flattened copy of
# this file. `save_dir` is assumed to be a top-level key (not a child of
# `tokenizer`) -- confirm against the code that loads this config.

prompt:
  # The sentence to be retrieved; the surrounding "\n" escapes are part of the
  # value, so it must stay double-quoted.
  needle: "\nThe best thing to do in San Francisco is eat a sandwich and sit in Dolores Park on a sunny day.\n"
  haystack_dir: "data/PaulGrahamEssays"
  # We use Anthropic's retrieval question as the default.
  retrieval_question: "What is the best thing to do in San Francisco? Here is the most relevant sentence in the context:"

context:
  min_len: 1000
  max_len: 8000
  # NOTE(review): presumably how many context lengths are sampled between
  # min_len and max_len -- confirm against the loader.
  interval: 10
  # null, or a list of context lengths to manually select
  manually_select_list: null

document_depth:
  min_percent: 10
  max_percent: 90
  interval: 10
  interval_type: "linear"  # "linear", "sigmoid" or null
  # null, or a list of document percents to manually select
  manually_select_list: null

tokenizer:
  tokenizer_type: "Huggingface"

save_dir: 'data/needle_test/Huggingface'