wcs-olap: build a start schema from data exported by w.c.s. API

Given such an .INI file:

	[https://demarches.triffouilly.fr/]
	orig = bi.triffouilly.fr
	key = 452b8964
	pg_dsn = dbname=publik-bi
	email = bi@entrouvert.com
	schema = triffouilly
	# slugs = recette-technique-ajout-d-un-enfant

It builds a schema named 'triffouilly' in the pre-existing database named 'publik-bi', the schema will contains tables named:

    channel (label varchar)
    role (label varchar)
    category (label varchar)
    form (category, label)
    formdata : parent table of all formdata tables)
        (form, receipt_time, year, month, dow, hour, channel, backoffice, generic_status)
    status (generic statuses: new, in progress & closed
        label

    for each formdef tables named:

       formdata_{formdef.slug}
       status_{formdef.slug}

       for each anonymisable
This commit is contained in:
Benjamin Dauvergne 2016-05-10 16:53:17 +02:00
parent b6b28a96cd
commit cb206893cd
2 changed files with 84 additions and 0 deletions

23
README.rst Normal file
View File

@ -0,0 +1,23 @@
BI for Publik
=============
w.c.s. OLAP
-----------
Tool to export w.c.s. data in a database with star schema for making an OLAP
cube.::
usage: wcs-olap --url URL [-h] --orig ORIG --key KEY
--pg-dsn PG_DSN
Export W.C.S. data as a star schema in a postgresql DB
optional arguments:
--url URL url of the w.c.s. instance
-h, --help show this help message and exit
--orig ORIG origin of the request for signatures
--key KEY HMAC key for signatures
--pg-dsn PG_DSN Psycopg2 DB DSN

61
setup.py Normal file
View File

@ -0,0 +1,61 @@
#! /usr/bin/env python
import subprocess
import os
from setuptools import setup, find_packages
from setuptools.command.sdist import sdist
class eo_sdist(sdist):
def run(self):
print "creating VERSION file"
if os.path.exists('VERSION'):
os.remove('VERSION')
version = get_version()
version_file = open('VERSION', 'w')
version_file.write(version)
version_file.close()
sdist.run(self)
print "removing VERSION file"
if os.path.exists('VERSION'):
os.remove('VERSION')
def get_version():
'''Use the VERSION, if absent generates a version with git describe, if not
tag exists, take 0.0.0- and add the length of the commit log.
'''
if os.path.exists('VERSION'):
with open('VERSION', 'r') as v:
return v.read()
if os.path.exists('.git'):
p = subprocess.Popen(['git', 'describe', '--dirty', '--match=v*'], stdout=subprocess.PIPE,
stderr=subprocess.PIPE)
result = p.communicate()[0]
if p.returncode == 0:
result = result.split()[0][1:]
else:
result = '0.0.0-%s' % len(subprocess.check_output(
['git', 'rev-list', 'HEAD']).splitlines())
return result.replace('-', '.').replace('.g', '+g')
return '0.0.0'
setup(name="wcs-olap",
version=get_version(),
license="AGPLv3+",
description="Export w.c.s. data to an OLAP cube",
long_description=open('README.rst').read(),
url="http://dev.entrouvert.org/projects/publik-bi/",
author="Entr'ouvert",
author_email="authentic@listes.entrouvert.com",
maintainer="Benjamin Dauvergne",
maintainer_email="bdauvergne@entrouvert.com",
packages=find_packages(),
include_package_data=True,
install_requires=['requests','psycopg2', 'isodate'],
entry_points={
'console_scripts': ['wcs-olap=wcs_olap.cmd:main'],
},
cmdclass={'sdist': eo_sdist})