debian-mirror-gitlab/app/assets/javascripts/pipelines/components/parsing_utils.js

import { uniqWith, isEqual } from 'lodash';

/*
    The following functions are the main engine in transforming the data as
    received from the endpoint into the format the d3 graph expects.

    Input is of the form:
    [nodes]
      nodes: [{category, name, jobs, size}]
        category is the stage name
        name is a group name; in the case that the group has one job, it is
          also the job name
        size is the number of parallel jobs
        jobs: [{ name, needs}]
          job name is either the same as the group name or group x/y
          needs: [job-names]
          needs is an array of job-name strings

    Output is of the form:
    { nodes: [node], links: [link] }
      node: { name, category }, + unused info passed through
      link: { source, target, value }, with source & target being node names
        and value being a constant

    We create nodes in the GraphQL update function, and then here we create the node dictionary,
    then create links, and then dedupe the links, so that in the case where
    job 4 depends on job 1 and job 2, and job 2 depends on job 1, we show only a single link
    from job 1 to job 2 then another from job 2 to job 4.

    CREATE LINKS
    nodes.name -> target
    nodes.name.needs.each -> source (source is the name of the group, not the parallel job)
    10 -> value (constant)
  */

export const createNodeDict = nodes => {
  return nodes.reduce((acc, node) => {
    const newNode = {
      ...node,
      needs: node.jobs.map(job => job.needs || []).flat(),
    };

    if (node.size > 1) {
      node.jobs.forEach(job => {
        acc[job.name] = newNode;
      });
    }

    acc[node.name] = newNode;
    return acc;
  }, {});
};

export const makeLinksFromNodes = (nodes, nodeDict) => {
  const constantLinkValue = 10; // all links are the same weight
  return nodes
    .map(group => {
      return group.jobs.map(job => {
        if (!job.needs) {
          return [];
        }

        return job.needs.map(needed => {
          return {
            source: nodeDict[needed]?.name,
            target: group.name,
            value: constantLinkValue,
          };
        });
      });
    })
    .flat(2);
};

export const getAllAncestors = (nodes, nodeDict) => {
  const needs = nodes
    .map(node => {
      return nodeDict[node].needs || '';
    })
    .flat()
    .filter(Boolean);

  if (needs.length) {
    return [...needs, ...getAllAncestors(needs, nodeDict)];
  }

  return [];
};

export const filterByAncestors = (links, nodeDict) =>
  links.filter(({ target, source }) => {
    /*

    for every link, check out it's target
    for every target, get the target node's needs
    then drop the current link source from that list

    call a function to get all ancestors, recursively
    is the current link's source in the list of all parents?
    then we drop this link

  */
    const targetNode = target;
    const targetNodeNeeds = nodeDict[targetNode].needs;
    const targetNodeNeedsMinusSource = targetNodeNeeds.filter(need => need !== source);

    const allAncestors = getAllAncestors(targetNodeNeedsMinusSource, nodeDict);
    return !allAncestors.includes(source);
  });

export const parseData = nodes => {
  const nodeDict = createNodeDict(nodes);
  const allLinks = makeLinksFromNodes(nodes, nodeDict);
  const filteredLinks = filterByAncestors(allLinks, nodeDict);
  const links = uniqWith(filteredLinks, isEqual);

  return { nodes, links };
};

/*
  The number of nodes in the most populous generation drives the height of the graph.
*/

export const getMaxNodes = nodes => {
  const counts = nodes.reduce((acc, { layer }) => {
    if (!acc[layer]) {
      acc[layer] = 0;
    }

    acc[layer] += 1;

    return acc;
  }, []);

  return Math.max(...counts);
};

/*
  Because we cannot know if a node is part of a relationship until after we
  generate the links with createSankey, this function is used after the first call
  to find nodes that have no relations.
*/

export const removeOrphanNodes = sankeyfiedNodes => {
  return sankeyfiedNodes.filter(node => node.sourceLinks.length || node.targetLinks.length);
};
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`import { uniqWith, isEqual } from 'lodash';`

			`/*`
			`The following functions are the main engine in transforming the data as`
			`received from the endpoint into the format the d3 graph expects.`

			`Input is of the form:`
New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`[nodes]`
			`nodes: [{category, name, jobs, size}]`
			`category is the stage name`
			`name is a group name; in the case that the group has one job, it is`
			`also the job name`
			`size is the number of parallel jobs`
			`jobs: [{ name, needs}]`
			`job name is either the same as the group name or group x/y`
			`needs: [job-names]`
			`needs is an array of job-name strings`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
			`Output is of the form:`
			`{ nodes: [node], links: [link] }`
			`node: { name, category }, + unused info passed through`
			`link: { source, target, value }, with source & target being node names`
			`and value being a constant`

New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`We create nodes in the GraphQL update function, and then here we create the node dictionary,`
			`then create links, and then dedupe the links, so that in the case where`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`job 4 depends on job 1 and job 2, and job 2 depends on job 1, we show only a single link`
			`from job 1 to job 2 then another from job 2 to job 4.`

			`CREATE LINKS`
New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`nodes.name -> target`
			`nodes.name.needs.each -> source (source is the name of the group, not the parallel job)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`10 -> value (constant)`
			`*/`

			`export const createNodeDict = nodes => {`
			`return nodes.reduce((acc, node) => {`
			`const newNode = {`
			`...node,`
			`needs: node.jobs.map(job => job.needs \|\| []).flat(),`
			`};`

			`if (node.size > 1) {`
			`node.jobs.forEach(job => {`
			`acc[job.name] = newNode;`
			`});`
			`}`

			`acc[node.name] = newNode;`
			`return acc;`
			`}, {});`
			`};`

			`export const makeLinksFromNodes = (nodes, nodeDict) => {`
			`const constantLinkValue = 10; // all links are the same weight`
			`return nodes`
			`.map(group => {`
			`return group.jobs.map(job => {`
			`if (!job.needs) {`
			`return [];`
			`}`

			`return job.needs.map(needed => {`
			`return {`
			`source: nodeDict[needed]?.name,`
			`target: group.name,`
			`value: constantLinkValue,`
			`};`
			`});`
			`});`
			`})`
			`.flat(2);`
			`};`

			`export const getAllAncestors = (nodes, nodeDict) => {`
			`const needs = nodes`
			`.map(node => {`
			`return nodeDict[node].needs \|\| '';`
			`})`
			`.flat()`
			`.filter(Boolean);`

			`if (needs.length) {`
			`return [...needs, ...getAllAncestors(needs, nodeDict)];`
			`}`

			`return [];`
			`};`

			`export const filterByAncestors = (links, nodeDict) =>`
			`links.filter(({ target, source }) => {`
			`/*`

			`for every link, check out it's target`
			`for every target, get the target node's needs`
			`then drop the current link source from that list`

			`call a function to get all ancestors, recursively`
			`is the current link's source in the list of all parents?`
			`then we drop this link`

			`*/`
			`const targetNode = target;`
			`const targetNodeNeeds = nodeDict[targetNode].needs;`
			`const targetNodeNeedsMinusSource = targetNodeNeeds.filter(need => need !== source);`

			`const allAncestors = getAllAncestors(targetNodeNeedsMinusSource, nodeDict);`
			`return !allAncestors.includes(source);`
			`});`

New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`export const parseData = nodes => {`
			`const nodeDict = createNodeDict(nodes);`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`const allLinks = makeLinksFromNodes(nodes, nodeDict);`
			`const filteredLinks = filterByAncestors(allLinks, nodeDict);`
			`const links = uniqWith(filteredLinks, isEqual);`

			`return { nodes, links };`
			`};`

			`/*`
			`The number of nodes in the most populous generation drives the height of the graph.`
			`*/`

			`export const getMaxNodes = nodes => {`
			`const counts = nodes.reduce((acc, { layer }) => {`
			`if (!acc[layer]) {`
			`acc[layer] = 0;`
			`}`

			`acc[layer] += 1;`

			`return acc;`
			`}, []);`

			`return Math.max(...counts);`
			`};`

			`/*`
			`Because we cannot know if a node is part of a relationship until after we`
			`generate the links with createSankey, this function is used after the first call`
			`to find nodes that have no relations.`
			`*/`

			`export const removeOrphanNodes = sankeyfiedNodes => {`
			`return sankeyfiedNodes.filter(node => node.sourceLinks.length \|\| node.targetLinks.length);`
			`};`