__init__.py 2.61 KB
Newer Older
Pierre Dittgen's avatar
Pierre Dittgen committed
1
import json
Christophe Benz's avatar
Christophe Benz committed
2
import logging
3
import os
4
import re
5
from pathlib import Path
6
from urllib.parse import quote_plus
7

8
import cachecontrol
9 10
import flask
import jinja2
11 12 13
import requests
import tableschema

14
import opendataschema
15

16
from . import config
17

Christophe Benz's avatar
Christophe Benz committed
18 19
log = logging.getLogger(__name__)

20

21 22 23
def generate_schema_from_url_func(session):
    """Generates a function that encloses session"""

24 25 26 27 28
    def tableschema_from_url(url):
        response = session.get(url)
        response.raise_for_status()
        descriptor = response.json()
        return tableschema.Schema(descriptor)
29

30 31 32
    return tableschema_from_url


33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54
def is_http_url(ref) -> bool:
    return isinstance(ref, str) and re.match("https?://", ref)


class SchemaCatalogRegistry:
    """Retain section_name -> catalog url matching
    and creates SchemaCatalog instance on demand"""

    def __init__(self, session):
        self.session = session
        self.url_map = {}

    def add_ref(self, name, url):
        self.url_map[name] = url

    def build_schema_catalog(self, name):
        if name in self.url_map:
            catalog_url = self.url_map[name]
            return opendataschema.SchemaCatalog(catalog_url, session=self.session)
        return None


55 56
caching_session = cachecontrol.CacheControl(requests.Session())
tableschema_from_url = generate_schema_from_url_func(caching_session)
57

58
# And load schema catalogs which URLs are found in homepage_config.json
59
schema_catalog_registry = SchemaCatalogRegistry(caching_session)
60
if config.HOMEPAGE_CONFIG:
Christophe Benz's avatar
Christophe Benz committed
61
    log.info("Initializing homepage sections...")
62
    for section in config.HOMEPAGE_CONFIG['sections']:
Christophe Benz's avatar
Christophe Benz committed
63 64
        name = section['name']
        log.info('Initializing homepage section "{}"...'.format(name))
65 66 67
        catalog_ref = section.get('catalog')
        if is_http_url(catalog_ref):
            schema_catalog_registry.add_ref(name, catalog_ref)
68
    log.info("...done")
69 70

# Flask things
71
app = flask.Flask(__name__)
72 73
app.secret_key = config.SECRET_KEY

Christophe Benz's avatar
Christophe Benz committed
74 75 76 77 78
matomo = None
if config.MATOMO_AUTH_TOKEN and config.MATOMO_BASE_URL and config.MATOMO_SITE_ID:
    from flask_matomo import Matomo
    matomo = Matomo(app, matomo_url=config.MATOMO_BASE_URL,
                    id_site=config.MATOMO_SITE_ID, token_auth=config.MATOMO_AUTH_TOKEN)
79

80 81 82 83
# Jinja2 url_quote_plus custom filter
# https://stackoverflow.com/questions/12288454/how-to-import-custom-jinja2-filters-from-another-file-and-using-flask
blueprint = flask.Blueprint('filters', __name__)

84

85 86 87 88 89 90
@jinja2.contextfilter
@blueprint.app_template_filter()
def urlencode(context, value):
    return quote_plus(value)


91
# Keep this import after app initialisation (to avoid cyclic imports)
92
from . import views  # noqa isort:skip