123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141 |
- """Loads datasets, dashboards and slices in a new superset instance"""
- import textwrap
- import pandas as pd
- from sqlalchemy import Float, String
- from sqlalchemy.sql import column
- from superset import db
- from superset.connectors.sqla.models import SqlMetric
- from superset.models.slice import Slice
- from superset.utils import core as utils
- from .helpers import get_example_data, merge_slice, misc_dash_slices, TBL
- def load_energy(only_metadata: bool = False, force: bool = False) -> None:
- """Loads an energy related dataset to use with sankey and graphs"""
- tbl_name = "energy_usage"
- database = utils.get_example_database()
- table_exists = database.has_table_by_name(tbl_name)
- if not only_metadata and (not table_exists or force):
- data = get_example_data("energy.json.gz")
- pdf = pd.read_json(data)
- pdf.to_sql(
- tbl_name,
- database.get_sqla_engine(),
- if_exists="replace",
- chunksize=500,
- dtype={"source": String(255), "target": String(255), "value": Float()},
- index=False,
- )
- print("Creating table [wb_health_population] reference")
- tbl = db.session.query(TBL).filter_by(table_name=tbl_name).first()
- if not tbl:
- tbl = TBL(table_name=tbl_name)
- tbl.description = "Energy consumption"
- tbl.database = database
- if not any(col.metric_name == "sum__value" for col in tbl.metrics):
- col = str(column("value").compile(db.engine))
- tbl.metrics.append(
- SqlMetric(metric_name="sum__value", expression=f"SUM({col})")
- )
- db.session.merge(tbl)
- db.session.commit()
- tbl.fetch_metadata()
- slc = Slice(
- slice_name="Energy Sankey",
- viz_type="sankey",
- datasource_type="table",
- datasource_id=tbl.id,
- params=textwrap.dedent(
- """\
- {
- "collapsed_fieldsets": "",
- "groupby": [
- "source",
- "target"
- ],
- "metric": "sum__value",
- "row_limit": "5000",
- "slice_name": "Energy Sankey",
- "viz_type": "sankey"
- }
- """
- ),
- )
- misc_dash_slices.add(slc.slice_name)
- merge_slice(slc)
- slc = Slice(
- slice_name="Energy Force Layout",
- viz_type="directed_force",
- datasource_type="table",
- datasource_id=tbl.id,
- params=textwrap.dedent(
- """\
- {
- "charge": "-500",
- "collapsed_fieldsets": "",
- "groupby": [
- "source",
- "target"
- ],
- "link_length": "200",
- "metric": "sum__value",
- "row_limit": "5000",
- "slice_name": "Force",
- "viz_type": "directed_force"
- }
- """
- ),
- )
- misc_dash_slices.add(slc.slice_name)
- merge_slice(slc)
- slc = Slice(
- slice_name="Heatmap",
- viz_type="heatmap",
- datasource_type="table",
- datasource_id=tbl.id,
- params=textwrap.dedent(
- """\
- {
- "all_columns_x": "source",
- "all_columns_y": "target",
- "canvas_image_rendering": "pixelated",
- "collapsed_fieldsets": "",
- "linear_color_scheme": "blue_white_yellow",
- "metric": "sum__value",
- "normalize_across": "heatmap",
- "slice_name": "Heatmap",
- "viz_type": "heatmap",
- "xscale_interval": "1",
- "yscale_interval": "1"
- }
- """
- ),
- )
- misc_dash_slices.add(slc.slice_name)
- merge_slice(slc)
|