config.yml 1.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051
  # Language code of the assistant's training data; the pipeline that follows
  # uses Chinese-specific components (Jieba tokenizer, bert-base-chinese).
  language: zh
  # NLU pipeline: components are listed in the order they appear here.
  # Options belonging to a component are nested under its `name` entry.
  pipeline:
    - name: JiebaTokenizer
    - name: LanguageModelFeaturizer
      model_name: bert
      model_weights: bert-base-chinese
    # NOTE(review): RegexEntityExtractor below sets use_word_boundaries: false
    # for Chinese text; RegexFeaturizer has no such setting here - confirm
    # whether it needs the same option.
    - name: RegexFeaturizer
    # Disabled component, kept for reference:
    # - name: CRFEntityExtractor
    - name: LexicalSyntacticFeaturizer
    - name: CountVectorsFeaturizer
    # Second CountVectorsFeaturizer: character n-grams (1-4) within word
    # boundaries, in addition to the default-configured instance above.
    - name: CountVectorsFeaturizer
      analyzer: char_wb
      min_ngram: 1
      max_ngram: 4
    # DIET handles both intent classification and entity recognition.
    - name: DIETClassifier
      entity_recognition: true
      intent_classification: true
      epochs: 400
      learning_rate: 0.0001
      ranking_length: 5
    - name: EntitySynonymMapper
    - name: RegexEntityExtractor
      use_word_boundaries: false  # needed for Chinese-language text
      use_lookup_tables: true
      use_regexes: true
    - name: FallbackClassifier
      threshold: 0.3
      ambiguity_threshold: 0.1
  # Dialogue policies. Options belonging to a policy are nested under its
  # `name` entry.
  policies:
    # RulePolicy is listed once, with its fallback settings. A second,
    # unconfigured RulePolicy entry that followed MemoizationPolicy was a
    # duplicate of this one and has been removed.
    - name: RulePolicy
      core_fallback_threshold: 0.3
      core_fallback_action_name: "action_default_fallback"
      enable_fallback_prediction: true
    - name: AugmentedMemoizationPolicy
      max_history: 6
    - name: TEDPolicy
      max_history: 10
      epochs: 40
      batch_size: 64
      embedding_dimension: 256
      # NOTE(review): the three keys below could not be matched to documented
      # TEDPolicy options - verify they are actually read by the policy.
      attention_dimension: 128
      entity_recognition_model: "DIETClassifier"
      entity_recognition_embeddings: "sentence_transformers_all-MiniLM-L6-v2"
    # NOTE(review): both AugmentedMemoizationPolicy and MemoizationPolicy are
    # configured - confirm that running both is intended.
    - name: MemoizationPolicy
  # Timeouts, in seconds.
  # NOTE(review): confirm that these top-level keys are read from config.yml
  # by the Rasa version in use; they may belong in a different settings file.
  response_timeout: 120  # in seconds
  action_execution_timeout: 120  # in seconds