site.py 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687
  1. import os
  2. from dotenv import load_dotenv
  3. from urllib.parse import quote
  4. from pydantic_settings import BaseSettings
  5. from typing import Dict, Union, Optional
  6. load_dotenv()
  7. class SiteConfig:
  8. def __init__(self):
  9. self.load_config()
  10. def load_config(self):
  11. self.config = {
  12. "SITE_NAME": os.getenv("SITE_NAME", "DEMO"),
  13. "SITE_DESCRIPTION": os.getenv("SITE_DESCRIPTION", "ChatGPT"),
  14. "SITE_URL": os.getenv("SITE_URL", ""),
  15. "SITE_LOGO": os.getenv("SITE_LOGO", ""),
  16. "SITE_FAVICON": os.getenv("SITE_FAVICON"),
  17. 'ELASTICSEARCH_HOST': os.getenv("ELASTICSEARCH_HOST"),
  18. 'ELASTICSEARCH_USER': os.getenv("ELASTICSEARCH_USER"),
  19. 'ELASTICSEARCH_PWD': os.getenv("ELASTICSEARCH_PWD"),
  20. 'WORD_INDEX': os.getenv("WORD_INDEX"),
  21. 'TITLE_INDEX': os.getenv("TITLE_INDEX"),
  22. 'CHUNC_INDEX': os.getenv("CHUNC_INDEX"),
  23. 'DEEPSEEK_API_URL': os.getenv("DEEPSEEK_API_URL"),
  24. 'DEEPSEEK_API_KEY': os.getenv("DEEPSEEK_API_KEY"),
  25. 'CACHED_DATA_PATH': os.getenv("CACHED_DATA_PATH"),
  26. 'UPDATE_DATA_PATH': os.getenv("UPDATE_DATA_PATH"),
  27. 'FACTOR_DATA_PATH': os.getenv("FACTOR_DATA_PATH"),
  28. 'GRAPH_API_URL': os.getenv("GRAPH_API_URL"),
  29. 'EMBEDDING_MODEL': os.getenv("EMBEDDING_MODEL"),
  30. 'DOC_PATH': os.getenv("DOC_PATH"),
  31. 'DOC_STORAGE_PATH': os.getenv("DOC_STORAGE_PATH"),
  32. 'TRUNC_OUTPUT_PATH': os.getenv("TRUNC_OUTPUT_PATH"),
  33. 'DOC_ABSTRACT_OUTPUT_PATH': os.getenv("DOC_ABSTRACT_OUTPUT_PATH"),
  34. 'JIEBA_USER_DICT': os.getenv("JIEBA_USER_DICT"),
  35. 'JIEBA_STOP_DICT': os.getenv("JIEBA_STOP_DICT"),
  36. 'POSTGRESQL_HOST': os.getenv("POSTGRESQL_HOST","localhost"),
  37. 'POSTGRESQL_DATABASE': os.getenv("POSTGRESQL_DATABASE","kg"),
  38. 'POSTGRESQL_USER': os.getenv("POSTGRESQL_USER","dify"),
  39. 'POSTGRESQL_PASSWORD': os.getenv("POSTGRESQL_PASSWORD",quote("difyai123456")),
  40. 'JOB_PATH': os.getenv("JOB_PATH","/app/agent/jobs"),
  41. }
  42. def get_config(self, config_name, default=None):
  43. config_name = config_name.upper()
  44. value = os.getenv(config_name, None)
  45. if value:
  46. return value
  47. if config_name in self.config:
  48. return self.config[config_name]
  49. else:
  50. return default
  51. def check_config(self, config_list):
  52. for item in config_list:
  53. if not self.get_config(item):
  54. raise ValueError(f"Configuration '{item}' is not set.")
  55. class Settings(BaseSettings):
  56. # PostgreSQL配置
  57. DATABASE_URL: str = "postgresql://knowledge:qwer1234.@173.18.12.203:5432/knowledge_base"
  58. # MinIO配置
  59. MINIO_ENDPOINT: str = "173.18.12.199:9000"
  60. MINIO_ACCESS_KEY: str = "yvhNcezRwQvPuUylHqrg"
  61. MINIO_SECRET_KEY: str = "QQCejGeENpUIkGr4yfDaubPwWCoV29xHoXv6gHYU"
  62. MINIO_BUCKET_NAME: str = "knowledge-base"
  63. MINIO_SECURE: bool = False
  64. # 文件上传配置
  65. MAX_FILE_COUNT: int = 100
  66. ALLOWED_EXTENSIONS: Dict[str, Dict[str, Union[int, Optional[int]]]] = {
  67. "doc": {"max_size": 50, "max_pages": 1000},
  68. "txt": {"max_size": 10, "max_pages": None},
  69. "docx": {"max_size": 50, "max_pages": 1000},
  70. "pdf": {"max_size": 500, "max_pages": 3000},
  71. "ppt": {"max_size": 50, "max_pages": 1000},
  72. "pptx": {"max_size": 50, "max_pages": 1000},
  73. "md": {"max_size": 10, "max_pages": None}
  74. }
  75. settings = Settings()