June 5, 2024
Currently, many IT teams work with agile methodologies such as Scrum and use tools such as Jira Software or Azure Boards to track activities during the Sprint. By default, these tools offer several charts for monitoring Sprint metrics. However, for more complex analyses involving each company's business rules, a customized solution is necessary.
As an alternative to that customization, this project builds a database for a Burndown chart enriched with the time spent by the team, adding an extra dimension of analysis to a metric already widely used to monitor the Sprint.
To develop the project, a sample board was created in Jira with fictitious data, simulating an IT team that uses Scrum.
Then, based on the data in Jira, an ELT process is carried out to make the data available for building the final chart in Power BI, as shown in the following image:
These tools were chosen because they allow the project to be carried out at zero cost, making the solution applicable even to small companies without adding maintenance costs. Furthermore, if a company already uses these or similar tools, the project can be adapted to its specifications and needs.
Cost breakdown per tool:
To extract data from Jira, it must be configured as a source in Airbyte: in Sources, search for and select the Jira connector. First, you need an API token to connect to Jira. If your Jira account does not already have a token, simply follow the Jira documentation linked in Airbyte to obtain one. The source can then be configured in Airbyte, with options to filter the project and set a start date:
The data will be loaded into a PostgreSQL database to be stored and transformed. To keep the solution in an isolated environment, PostgreSQL will run in a Docker container. Docker Desktop is secure, out-of-the-box containerization software that offers developers and teams a robust, hybrid toolkit to build, share, and run applications anywhere.
To install Docker locally, simply follow the instructions for your operating system at https://www.docker.com/products/docker-desktop/.
Docker allows us to create a fully customized container with the necessary software, files, and configurations from a Dockerfile. The Dockerfile produces a Docker image that serves as a template for creating containers with the configurations it defines.
Due to the Airbyte update process, which will be explained in section 9, some customizations are necessary in the container. Therefore, the container will be created from a customized image, built with the following Dockerfile (a file named Dockerfile, without extension):
# Get postgres image in version 16.1 as base
FROM postgres:16.1
# Update and install cron and vim
RUN apt-get update && apt-get install -y cron vim
# Set cron time zone to Sao Paulo
RUN echo "America/Sao_Paulo" > /etc/timezone
# Set the container time zone to Sao Paulo
RUN ln -sf /usr/share/zoneinfo/America/Sao_Paulo /etc/localtime
# Copy crontab file with schedule settings
COPY crontab /var/spool/cron/crontabs/root
# Copy the shell scripts to be executed by crontab
COPY drop_view.sh /tmp
COPY create_view.sh /tmp
# Give execution permission to the files
RUN chmod +x /tmp/drop_view.sh
RUN chmod +x /tmp/create_view.sh
With the Dockerfile created, open a terminal in the folder where the file is located and run the command below (note: the drop_view.sh, create_view.sh, and crontab files must already exist; their contents are presented in section 9):
docker build -t postgres-cron-vim:16.1 .
Then run the command below to create the container, passing the environment variables:
docker run -d --name dashboardscrum -p 5579:5432 -e POSTGRES_DB=DashboardScrum -e POSTGRES_USER=user -e POSTGRES_PASSWORD=XXXX postgres-cron-vim:16.1
Note: PostgreSQL's default port is 5432, but if the local machine is already running PostgreSQL or port 5432 is otherwise in use, port mapping can be applied (-p 5579:5432). In that case, access is through port 5579 on the local machine, which is redirected to port 5432 inside the container, where PostgreSQL runs on its default port.
To access the database, pgAdmin can be used, available for download at https://www.pgadmin.org/download/. In this project, pgAdmin was installed locally, but it can also be installed and accessed through a Docker container.
After accessing the pgAdmin screen, right-click on Servers > Register > Server...
Then carry out the configuration according to the port and environment variables defined in the container creation command.
To load data into PostgreSQL, it must be configured as a destination in Airbyte: in Destinations, search for and select the Postgres connector and configure it according to the environment variables defined in the container creation command:
To configure the connection in Airbyte, in Connections, select the source (Jira) and the destination (Postgres). When selecting streams, choose the tables with their respective sync modes (by default, some other tables come pre-selected and must be deselected):
Note: in the stream selection it is also possible to choose which columns will be extracted from each table, so the selected columns can be adapted to the company's needs.
Next, configure the connection's name and set its schedule to manual, so that the first load into the database can be triggered by hand.
After configuring the connection, open it under Connections and click "Sync now" to perform the first load into the database.
To build the Burndown chart, the following information will be needed:
To make this data available for use in Power BI, a view containing this information will be built.
After exploratory analysis and data manipulation in pgAdmin, four functions were designed to be used in building the view. The next topics present their respective code.
CREATE FUNCTION cont_dias_sprint(sprint_name VARCHAR)
RETURNS SETOF NUMERIC AS $$
-- Select the number of Sprint days minus 1 for division in the planned column
SELECT COUNT(intervalo) - 1
FROM generate_series(
-- Generate a series of dates between the start and end days of the sprint
(SELECT "startDate" FROM public.sprints WHERE name = sprint_name),
(SELECT "endDate" FROM public.sprints WHERE name = sprint_name),
INTERVAL '1 day'
) AS intervalo
-- Extract the days of the week and filter to remove Saturday and Sunday
WHERE EXTRACT(dow FROM intervalo) NOT IN (6, 0);
$$ LANGUAGE sql;
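The weekday-counting logic of cont_dias_sprint can be sketched in Python. This is illustrative only (the project itself uses the SQL function above); it operates on plain dates rather than the sprints table:

```python
from datetime import date, timedelta

def cont_dias_sprint(start: date, end: date) -> int:
    """Count the weekdays (Mon-Fri) between start and end, inclusive,
    minus 1 -- mirroring the SQL function used as the divisor for the
    planned (ideal) burndown line."""
    days = 0
    current = start
    while current <= end:
        if current.weekday() < 5:  # 0-4 = Monday-Friday
            days += 1
        current += timedelta(days=1)
    return days - 1

# A two-week sprint starting on a Monday has 10 weekdays -> 9 intervals
print(cont_dias_sprint(date(2024, 6, 3), date(2024, 6, 14)))  # 9
```

Subtracting 1 matters because a sprint with N working days has N - 1 daily decrements between its first and last point on the planned line.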
CREATE FUNCTION estimado_total(sprint_name VARCHAR)
RETURNS SETOF NUMERIC AS $$
-- Sum the estimate for each card and bring it into relation with the sprint
SELECT SUM((CAST((i.fields -> 'timeoriginalestimate') AS INTEGER))/3600)
FROM public.issues AS i
JOIN public.sprint_issues AS si ON i.key = si.key
JOIN public.sprints AS s ON si."sprintId" = s.Id
WHERE s.name = sprint_name
GROUP BY s.name;
$$ LANGUAGE sql;
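The seconds-to-hours conversion in estimado_total, including the truncation caused by integer division, can be sketched in Python. The function below is illustrative only, operating on a plain list of per-issue estimates instead of the Jira tables:

```python
def estimado_total(estimates_seconds):
    """Sum per-issue 'timeoriginalestimate' values (in seconds) converted
    to hours. Integer division per row mirrors the SQL CAST(...)/3600,
    which truncates fractional hours."""
    return sum(e // 3600 for e in estimates_seconds)

# Cards estimated at 2h, 4h and 1.5h: the 1.5h card truncates to 1h
print(estimado_total([7200, 14400, 5400]))  # 7
```

If fractional hours should be preserved, the SQL would need to divide by 3600.0 instead; the truncating behavior above matches the view as written.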
CREATE OR REPLACE FUNCTION planejado_ideal(sprint_name VARCHAR)
RETURNS TABLE (dia DATE, planejado NUMERIC) AS $$
DECLARE
-- Declare variable to be used in the loop starting with the total estimated value for the sprint
current_value NUMERIC := estimado_total(sprint_name);
-- Declare increment variable
increment_value NUMERIC := estimado_total(sprint_name) / cont_dias_sprint(sprint_name);
BEGIN
FOR dia IN
-- Loop to run through sprint days
SELECT intervalo
FROM generate_series(
(SELECT "startDate" FROM public.sprints WHERE name = sprint_name),
(SELECT "endDate" FROM public.sprints WHERE name = sprint_name),
INTERVAL '1 day') AS intervalo
WHERE EXTRACT(dow FROM intervalo) NOT IN (6, 0)
LOOP
-- Starting with the first value as the estimated sprint total
planejado := current_value;
RETURN NEXT;
-- Update next column value being the previous one minus the increment
current_value := current_value - increment_value;
END LOOP;
RETURN;
END;
$$ LANGUAGE plpgsql;
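The loop in planejado_ideal can be sketched in Python. Here num_days is the sprint's weekday count and the divisor is num_days - 1, matching cont_dias_sprint's "count minus 1"; the function is illustrative only:

```python
def planejado_ideal(total_hours, num_days):
    """Generate the ideal burndown line: start at the sprint's total
    estimate and subtract an equal increment each weekday, mirroring
    the plpgsql loop. num_days is the number of weekdays in the sprint."""
    increment = total_hours / (num_days - 1)
    return [total_hours - i * increment for i in range(num_days)]

# A 40h sprint over 5 weekdays burns 10h per day on the ideal line
print(planejado_ideal(40, 5))  # [40.0, 30.0, 20.0, 10.0, 0.0]
```

Note that the line starts at the full estimate and reaches exactly zero on the last day, which is why the divisor is one less than the number of days plotted.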
CREATE OR REPLACE FUNCTION horas_restantes(sprint_name VARCHAR, prev_horas_entregues NUMERIC, datas DATE)
RETURNS TABLE(dia DATE, horas_restantes NUMERIC) AS $$
DECLARE
-- Set cursor to run through all days of each sprint
tbl_cursor CURSOR FOR (
SELECT s.name AS sprint, data.data :: DATE
FROM public.sprints AS s
CROSS JOIN generate_series(s."startDate", s."endDate", interval '1 day') AS data
WHERE EXTRACT(dow FROM data.data) NOT IN (6, 0) AND s.name = sprint_name
ORDER BY data
);
tbl_row RECORD;
-- Set initial value as estimated total for sprint
horas_restantes NUMERIC := estimado_total(sprint_name);
-- Define control variables so that each iteration can use the previous day's delivered hours
horas_entregues NUMERIC := 0;
current_value NUMERIC := 0;
BEGIN
OPEN tbl_cursor;
LOOP
-- Set stopping criteria for the cursor
FETCH FROM tbl_cursor INTO tbl_row;
EXIT WHEN NOT FOUND;
-- Select delivered hours
SELECT COALESCE(SUM((issues.fields ->> 'timeoriginalestimate')::INTEGER / 3600), 0)
INTO horas_entregues
FROM issues
WHERE to_date(issues.fields ->> 'resolutiondate', 'YYYY-MM-DD') = tbl_row.data;
-- Subtract the value in the remaining hours column from the value of delivered hours
horas_restantes := horas_restantes - current_value;
-- Store the value of delivered hours on date x, so that in the next iteration this value
-- will be subtracted, representing the hours delivered on the previous date (x-1)
current_value := horas_entregues;
-- Returning the date and remaining hours in each iteration
RETURN QUERY SELECT tbl_row.data, horas_restantes;
END LOOP;
CLOSE tbl_cursor;
END;
$$ LANGUAGE plpgsql;
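The one-day lag implemented with current_value in the cursor loop above (each day's row subtracts the previous day's delivered hours) can be sketched in Python. The list-based function below is illustrative only:

```python
def horas_restantes(total_hours, delivered_per_day):
    """Walk the sprint days, subtracting the PREVIOUS day's delivered
    hours from the running remainder -- mirroring the one-iteration lag
    in the plpgsql cursor loop."""
    remaining = total_hours
    prev_delivered = 0
    result = []
    for delivered_today in delivered_per_day:
        remaining -= prev_delivered
        result.append(remaining)
        prev_delivered = delivered_today
    return result

# 40h sprint with 0h, 16h, 8h, 8h and 8h delivered on each weekday:
# each day's point reflects what was closed up to the previous day
print(horas_restantes(40, [0, 16, 8, 8, 8]))  # [40, 40, 24, 16, 8]
```

The lag means the chart shows hours still open at the start of each day, which is the usual convention for a burndown point.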
CREATE OR REPLACE VIEW public.vw_dadosburndown AS
WITH dados_sprint AS (
SELECT
s.name AS sprint,
data.data :: DATE
FROM public.sprints AS s
CROSS JOIN generate_series(s."startDate", s."endDate", INTERVAL '1 day') AS data
WHERE EXTRACT(dow FROM data.data) NOT IN (6, 0)
ORDER BY data
),
dados_horas_entregues AS(
SELECT
SUM((CAST((fields -> 'timeoriginalestimate') AS INTEGER))/3600) AS horas_entregues,
to_date(fields ->> 'resolutiondate', 'YYYY-MM-DD') AS data_encerramento
FROM public.issues
GROUP BY data_encerramento
),
prev_dados_tempo_gasto AS(
SELECT
CAST((jsonb_array_elements(fields -> 'worklog' -> 'worklogs') -> 'timeSpentSeconds') AS INTEGER)/3600 AS tempo_gasto,
to_date(jsonb_array_elements(fields -> 'worklog' -> 'worklogs') ->> 'updated', 'YYYY-MM-DD') AS dia_gasto
FROM public.issues
),
dados_tempo_gasto AS(
SELECT
dia_gasto,
SUM(tempo_gasto) AS tempo_gasto
FROM prev_dados_tempo_gasto
GROUP BY dia_gasto
)
SELECT
ds.sprint,
ds.data,
dhe.horas_entregues,
dtg.tempo_gasto,
plan.planejado,
he.horas_restantes
FROM dados_sprint AS ds
LEFT JOIN LATERAL planejado_ideal(ds.sprint) AS plan ON ds.data = plan.dia
LEFT JOIN dados_horas_entregues AS dhe ON ds.data = dhe.data_encerramento
LEFT JOIN dados_tempo_gasto AS dtg ON ds.data = dtg.dia_gasto
JOIN horas_restantes(ds.sprint, dhe.horas_entregues, ds.data) AS he ON ds.data = he.dia
ORDER BY ds.sprint,ds.data;
In pgAdmin, the view returns the following table of data. Next, PostgreSQL will be connected to Power BI to build the Burndown chart with time spent.
In Power BI, the "PostgreSQL database" source must be used. For this project, Power BI was accessed from another machine, so in the server field it is necessary to configure the IP and port (if a different port was mapped when creating the container):
Afterward, enter the username and password according to the environment variables defined in the container creation command:
And finally, select the created view from the available tables:
As can be seen in the chart, for the sprint in question, deliveries ran late (remaining hours above the planned line) until 10/06/2024. Then more time spent is recorded on that day and the next, which may explain the improved performance in the last days of the sprint. Furthermore, tracking the time spent per day can also help a team mature when it does not yet have good time control.
To update the data, a schedule can be set in Airbyte. However, this project requires a small adaptation. The "sprints" table does not have a column that would allow an incremental append of data, so its sync mode is "Full refresh | Overwrite". In this mode, Airbyte drops (deletes) the table and then rebuilds it with the updated data. However, since the "sprints" table is used by the database view, it cannot be dropped while the view exists. To overcome this, the proposed solution is to schedule the drop and re-creation of the view with cron inside the container, and run the Airbyte update between these two commands.
This is why, when creating the container, the files drop_view.sh, create_view.sh, and crontab were copied: respectively, the script to drop the view, the script to recreate the view, and the cron schedule. The next topics present these files.
#!/bin/bash
# Set environment variables for PostgreSQL
export PGHOST=localhost
export PGUSER=user
export PGPASSWORD=XXXX
export PGDATABASE=DashboardScrum
# Execute the drop view command
psql -c "DROP VIEW IF EXISTS public.vw_dadosburndown;"
#!/bin/bash
# Set environment variables for PostgreSQL
export PGHOST=localhost
export PGUSER=user
export PGPASSWORD=XXXX
export PGDATABASE=DashboardScrum
# Variable with view creation
VIEW_DEFINITION="
CREATE OR REPLACE VIEW public.vw_dadosburndown AS
WITH dados_sprint AS (
SELECT
s.name AS sprint,
data.data :: DATE
FROM public.sprints AS s
CROSS JOIN generate_series(s.\"startDate\", s.\"endDate\", INTERVAL '1 day') AS data
WHERE EXTRACT(dow FROM data.data) NOT IN (6, 0)
ORDER BY data
),
dados_horas_entregues AS(
SELECT
SUM((CAST((fields -> 'timeoriginalestimate') AS INTEGER))/3600) AS horas_entregues,
to_date(fields ->> 'resolutiondate', 'YYYY-MM-DD') AS data_encerramento
FROM public.issues
GROUP BY data_encerramento
),
prev_dados_tempo_gasto AS(
SELECT
CAST((jsonb_array_elements(fields -> 'worklog' -> 'worklogs') -> 'timeSpentSeconds') AS INTEGER)/3600 AS tempo_gasto,
to_date(jsonb_array_elements(fields -> 'worklog' -> 'worklogs') ->> 'updated', 'YYYY-MM-DD') AS dia_gasto
FROM public.issues
),
dados_tempo_gasto AS(
SELECT
dia_gasto,
SUM(tempo_gasto) AS tempo_gasto
FROM prev_dados_tempo_gasto
GROUP BY dia_gasto
)
SELECT
ds.sprint,
ds.data,
dhe.horas_entregues,
dtg.tempo_gasto,
plan.planejado,
he.horas_restantes
FROM dados_sprint AS ds
LEFT JOIN LATERAL planejado_ideal(ds.sprint) AS plan ON ds.data = plan.dia
LEFT JOIN dados_horas_entregues AS dhe ON ds.data = dhe.data_encerramento
LEFT JOIN dados_tempo_gasto AS dtg ON ds.data = dtg.dia_gasto
JOIN horas_restantes(ds.sprint, dhe.horas_entregues, ds.data) AS he ON ds.data = he.dia
ORDER BY ds.sprint,ds.data;"
# Executing the view creation command
psql -c "$VIEW_DEFINITION"
0 3 * * 1-5 /tmp/drop_view.sh >> /tmp/cron_drop.log 2>&1
0 5 * * 1-5 /tmp/create_view.sh >> /tmp/cron_create.log 2>&1
This way, the scripts run at 3:00 am and 5:00 am, Monday to Friday, and their output and errors are recorded in the cron_drop.log and cron_create.log files in the container's /tmp directory.
Note: with >> all executions are appended to the log; with > only the output of the last execution is kept.
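The same overwrite-versus-append behavior can be illustrated in Python, where file mode "w" behaves like > and "a" like >> (the function and file names here are illustrative):

```python
import os
import tempfile

def write_runs(path: str, mode: str, runs) -> str:
    """Write each run's output to `path` using the given file mode:
    'w' mirrors the shell's '>' (truncate on every open),
    'a' mirrors '>>' (append, preserving history). Returns the
    file's final contents."""
    for run in runs:
        with open(path, mode) as f:
            f.write(run + "\n")
    with open(path) as f:
        return f.read()

log = os.path.join(tempfile.mkdtemp(), "cron_demo.log")
print(write_runs(log, "w", ["run 1", "run 2"]))  # only "run 2" survives
print(write_runs(log, "a", ["run 3", "run 4"]))  # earlier contents are kept
```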
To activate the cron jobs, open a shell in the container's terminal and run the following command:
service cron start
To check whether cron is actually running, use the command:
service cron status
Finally, schedule the update in Airbyte, which can be done in the connection's Settings, as shown in the following image:
This way, at 3:00 am the view is dropped from the database, at 4:00 am Airbyte updates the database, and at 5:00 am the view is recreated, leaving the data available to be refreshed in Power BI as usual. This is just a suggested configuration; the scheduling can be changed according to the company's needs.
The Burndown with time spent chart is just one example of what can be done by extracting raw data from Jira and transforming it, and this transformation can be adapted to each company's needs and business rules. It is worth remembering that there are plug-ins and applications that can be added to Jira for customized charts; however, they are not always free, and building the solution this way gives much greater flexibility to design the charts and implement the company's business rules.
If you have any questions or suggestions, or just want to talk about this project, feel free to reach out.
E-mail: gabrielapbarros15@gmail.com
LinkedIn: https://www.linkedin.com/in/gabriela-pereira-barros/