# Identity and branding of this instance; every value can be overridden
# through the matching ALEPH_* environment variable.
APP_TITLE = env.get("ALEPH_APP_TITLE", lazy_gettext("Aleph"))
APP_DESCRIPTION = env.get("ALEPH_APP_DESCRIPTION", "")
APP_NAME = env.get("ALEPH_APP_NAME", "aleph")
APP_UI_URL = env.get("ALEPH_UI_URL", "http://localhost:8080/")
APP_LOGO = env.get("ALEPH_LOGO", "/static/logo.png")
# The favicon defaults to the same image as the logo.
APP_FAVICON = env.get("ALEPH_FAVICON", "/static/logo.png")

# Show a system-wide banner in the user interface.
APP_BANNER = env.get("ALEPH_APP_BANNER")

# Force HTTPS here (URL scheme, "http" unless overridden):
URL_SCHEME = env.get("ALEPH_URL_SCHEME", "http")

# Shown on the home page as a few sample queries:
SAMPLE_SEARCHES = env.to_list(
    "ALEPH_SAMPLE_SEARCHES",
    [lazy_gettext("TeliaSonera"), lazy_gettext("Vladimir Putin")],
)

# Cross-origin resource sharing; origins are separated by "|".
CORS_ORIGINS = env.to_list("ALEPH_CORS_ORIGINS", separator="|")

###############################################################################
# Data storage

# Archive type (either 's3' or 'file', i.e. local file system).
# Defaults for all three values come from the `sls` settings module.
ARCHIVE_TYPE = env.get("ALEPH_ARCHIVE_TYPE", sls.ARCHIVE_TYPE)
ARCHIVE_BUCKET = env.get("ALEPH_ARCHIVE_BUCKET", sls.ARCHIVE_BUCKET)
ARCHIVE_PATH = env.get("ALEPH_ARCHIVE_PATH", sls.ARCHIVE_PATH)

##############################################################################
# Security and authentication.
###############################################################################
# General instance information

# Identity and branding of this instance; every value can be overridden
# through the matching ALEPH_* environment variable.
APP_TITLE = env.get("ALEPH_APP_TITLE", lazy_gettext("Aleph"))
APP_DESCRIPTION = env.get("ALEPH_APP_DESCRIPTION", "")
APP_NAME = env.get("ALEPH_APP_NAME", "aleph")
APP_UI_URL = env.get("ALEPH_UI_URL", "http://localhost:8080/")
APP_LOGO = env.get("ALEPH_LOGO", "/static/logo.png")
APP_FAVICON = env.get("ALEPH_FAVICON", "/static/favicon.png")

# Show a system-wide banner in the user interface.
APP_BANNER = env.get("ALEPH_APP_BANNER")

# Shown on the home page as a few sample queries:
SAMPLE_SEARCHES = env.to_list(
    "ALEPH_SAMPLE_SEARCHES",
    [lazy_gettext("TeliaSonera"), lazy_gettext("Vladimir Putin")],
)

# Force HTTPS here (off unless ALEPH_FORCE_HTTPS is set):
FORCE_HTTPS = env.to_bool("ALEPH_FORCE_HTTPS", False)

# Content security policy:
# NOTE(review): CSP directive names are normally not followed by a colon
# ("default-src 'self' ..."); confirm how this value is consumed before
# changing the default.
CONTENT_POLICY = env.get(
    "ALEPH_CONTENT_POLICY",
    "default-src: 'self' 'unsafe-inline' 'unsafe-eval' data: *",
)

# Cross-origin resource sharing; origins are separated by "|" and any origin
# is accepted by default.
CORS_ORIGINS = env.to_list("ALEPH_CORS_ORIGINS", ["*"], separator="|")

##############################################################################
# Security and authentication.

# Required: set a secret key
# Document conversion endpoint. INGESTORS_CONVERT_DOCUMENT_URL takes
# precedence; UNOSERVICE_URL is consulted for the fallback value.
CONVERT_URL = env.get(
    "INGESTORS_CONVERT_DOCUMENT_URL",
    env.get("UNOSERVICE_URL", "http://convert-document:3000/convert"),
)
CONVERT_TIMEOUT = env.to_int("INGESTORS_CONVERT_TIMEOUT", 7200)  # 2 hrs
CONVERT_RETRIES = env.to_int("INGESTORS_CONVERT_RETRIES", 256)

# Enable (expensive!) Google Cloud API
OCR_VISION_API = env.to_bool("INGESTORS_OCR_VISION_API", False)

# Geonames data file
GEONAMES_PATH = env.get("INGESTORS_GEONAMES_PATH", "/ingestors/data/geonames.txt")

# FastText lid model file
LID_MODEL_PATH = env.get("INGESTORS_LID_MODEL_PATH", "/ingestors/data/lid.176.ftz")

# Disable entity extraction
ANALYZE_ENTITIES = env.to_bool("INGESTORS_ANALYZE_ENTITIES", True)

# List available NER models
NER_MODELS = set(env.to_list("INGESTORS_NER_MODELS", ["eng"]))
# Entries listed in NER_DISABLE; "ara" unless INGESTORS_NER_DISABLE is set.
NER_DISABLE = set(env.to_list("INGESTORS_NER_DISABLE", ["ara"]))
NER_DEFAULT_MODEL = "xx"

# Use the environment variable set in aleph.env
sts.DATABASE_URI = env.get("ALEPH_DATABASE_URI", sts.DATABASE_URI)

# Also store cached values in the SQL database
sls.TAGS_DATABASE_URI = sts.DATABASE_URI
# Force HTTPS here. The default is derived from the UI URL: it is on when
# that URL already starts with "https" (case-insensitive), and can be
# overridden with ALEPH_FORCE_HTTPS.
FORCE_HTTPS = APP_UI_URL.lower().startswith("https")
FORCE_HTTPS = env.to_bool("ALEPH_FORCE_HTTPS", FORCE_HTTPS)

# The preferred URL scheme follows FORCE_HTTPS unless ALEPH_URL_SCHEME is set.
PREFERRED_URL_SCHEME = "https" if FORCE_HTTPS else "http"
PREFERRED_URL_SCHEME = env.get("ALEPH_URL_SCHEME", PREFERRED_URL_SCHEME)

# Apply HTTPS rules to the UI URL: rewrite its scheme to the preferred one.
APP_PARSED_UI_URL = urlparse(APP_UI_URL)._replace(scheme=PREFERRED_URL_SCHEME)
APP_UI_URL = APP_PARSED_UI_URL.geturl()

# Content security policy:
# NOTE(review): CSP directive names are normally not followed by a colon
# ("default-src 'self' ..."); confirm how this value is consumed before
# changing the default.
CONTENT_POLICY = "default-src: 'self' 'unsafe-inline' 'unsafe-eval' data: *"
CONTENT_POLICY = env.get("ALEPH_CONTENT_POLICY", CONTENT_POLICY)

# Cross-origin resource sharing; origins are separated by "|" and any origin
# is accepted by default.
CORS_ORIGINS = env.to_list("ALEPH_CORS_ORIGINS", ["*"], separator="|")

##############################################################################
# Security and authentication.

# Required: set a secret key
SECRET_KEY = env.get("ALEPH_SECRET_KEY")

# Designate users with the given email as admins automatically:
# Assumes a comma-separated list.
ADMINS = env.to_list("ALEPH_ADMINS")

# Set the foreign ID of the default system user.
SYSTEM_USER = env.get("ALEPH_SYSTEM_USER", "system:aleph")

# Configure your OAUTH login provider, providing the details as described in
TESTING = False

# Document conversion service. INGESTORS_CONVERT_DOCUMENT_URL takes
# precedence; UNOSERVICE_URL is consulted for the fallback value.
CONVERT_URL = env.get(
    "INGESTORS_CONVERT_DOCUMENT_URL",
    env.get("UNOSERVICE_URL", "http://convert-document:3000/convert"),
)
CONVERT_TIMEOUT = env.to_int("INGESTORS_CONVERT_TIMEOUT", 7200)  # 2 hrs

# Enable (expensive!) Google Cloud API
OCR_VISION_API = env.to_bool("INGESTORS_OCR_VISION_API", False)

# Geonames data file
GEONAMES_PATH = env.get("INGESTORS_GEONAMES_PATH", "/ingestors/data/geonames.txt")

# FastText lid model file
LID_MODEL_PATH = env.get("INGESTORS_LID_MODEL_PATH", "/ingestors/data/lid.176.ftz")

# Disable entity extraction
ANALYZE_ENTITIES = env.to_bool("INGESTORS_ANALYZE_ENTITIES", True)

# List available NER models
NER_MODELS = set(env.to_list("INGESTORS_NER_MODELS", ["eng"]))
NER_DEFAULT_MODEL = "xx"

# Use the environment variable set in aleph.env
sts.DATABASE_URI = env.get("ALEPH_DATABASE_URI", sts.DATABASE_URI)

# Also store cached values in the SQL database
sls.TAGS_DATABASE_URI = sts.DATABASE_URI
TESTING = False

# Document conversion service: the converter endpoint is read from
# INGESTORS_CONVERT_DOCUMENT_URL, with UNOSERVICE_URL supplying the fallback.
CONVERT_URL = env.get(
    "INGESTORS_CONVERT_DOCUMENT_URL",
    env.get("UNOSERVICE_URL", "http://convert-document:3000/convert"),
)
# Conversion timeout; 7200 is two hours if the unit is seconds.
CONVERT_TIMEOUT = env.to_int("INGESTORS_CONVERT_TIMEOUT", 7200)

# Enable (expensive!) Google Cloud API
OCR_VISION_API = env.to_bool("INGESTORS_OCR_VISION_API", False)

# Geonames data file
GEONAMES_PATH = env.get(
    "INGESTORS_GEONAMES_PATH",
    "/ingestors/data/geonames.txt",
)

# FastText lid model file
LID_MODEL_PATH = env.get(
    "INGESTORS_LID_MODEL_PATH",
    "/ingestors/data/lid.176.ftz",
)

# Disable entity extraction
ANALYZE_ENTITIES = env.to_bool("INGESTORS_ANALYZE_ENTITIES", True)

# List available NER models
NER_MODELS = set(env.to_list("INGESTORS_NER_MODELS", ["eng"]))
NER_DEFAULT_MODEL = "xx"

# Use the environment variable set in aleph.env
sts.DATABASE_URI = env.get("ALEPH_DATABASE_URI", sts.DATABASE_URI)

# Also store cached values in the SQL database
sls.TAGS_DATABASE_URI = sts.DATABASE_URI
DEBUGPY_WAIT_FOR_CLIENT = env.to_bool("INGESTORS_DEBUGPY_WAIT_FOR_CLIENT", False)

# Document conversion service. INGESTORS_CONVERT_DOCUMENT_URL takes
# precedence; UNOSERVICE_URL is consulted for the fallback value.
CONVERT_URL = env.get(
    "INGESTORS_CONVERT_DOCUMENT_URL",
    env.get("UNOSERVICE_URL", "http://convert-document:3000/convert"),
)
CONVERT_TIMEOUT = env.to_int("INGESTORS_CONVERT_TIMEOUT", 7200)  # 2 hrs

# Enable (expensive!) Google Cloud API
OCR_VISION_API = env.to_bool("INGESTORS_OCR_VISION_API", False)

# Enable Google Cloud Translation API
TRANSLATION_API = env.to_bool("INGESTORS_TRANSLATION_API", False)

# White list of language IDs for languages that should be translated.
# An empty white list is considered a wildcard, allowing all languages to be
# translated.
TRANSLATION_LANGUAGE_WHITE_LIST = env.to_list(
    "INGESTORS_TRANSLATION_LANGUAGE_WHITE_LIST",
    None,
)

# Black list of language IDs for languages that should NOT be translated.
# An empty black list means that no languages are restricted.
# The black list takes precedence over the white list.
TRANSLATION_LANGUAGE_BLACK_LIST = env.to_list(
    "INGESTORS_TRANSLATION_LANGUAGE_BLACK_LIST",
    ["en", "eng"],
)

# Geonames data file
GEONAMES_PATH = env.get("INGESTORS_GEONAMES_PATH", "/ingestors/data/geonames.txt")

# FastText lid model file
LID_MODEL_PATH = env.get("INGESTORS_LID_MODEL_PATH", "/ingestors/data/lid.176.ftz")

# Disable entity extraction
ANALYZE_ENTITIES = env.to_bool("INGESTORS_ANALYZE_ENTITIES", True)