| 
									
										
										
										
											2018-07-30 23:08:51 +08:00
										 |  |  | /* | 
					
						
							|  |  |  | 	MIT License http://www.opensource.org/licenses/mit-license.php
 | 
					
						
							|  |  |  | 	Author Tobias Koppers @sokra | 
					
						
							|  |  |  | */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | "use strict"; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // Simulations show these probabilities for a single change
 | 
					
						
							|  |  |  | // 93.1% that one group is invalidated
 | 
					
						
							|  |  |  | // 4.8% that two groups are invalidated
 | 
					
						
							|  |  |  | // 1.1% that 3 groups are invalidated
 | 
					
						
							|  |  |  | // 0.1% that 4 or more groups are invalidated
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // And these for removing/adding 10 lexically adjacent files
 | 
					
						
							|  |  |  | // 64.5% that one group is invalidated
 | 
					
						
							|  |  |  | // 24.8% that two groups are invalidated
 | 
					
						
							|  |  |  | // 7.8% that 3 groups are invalidated
 | 
					
						
							|  |  |  | // 2.7% that 4 or more groups are invalidated
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // And these for removing/adding 3 random files
 | 
					
						
							|  |  |  | // 0% that one group is invalidated
 | 
					
						
							|  |  |  | // 3.7% that two groups are invalidated
 | 
					
						
							|  |  |  | // 80.8% that 3 groups are invalidated
 | 
					
						
							|  |  |  | // 12.3% that 4 groups are invalidated
 | 
					
						
							|  |  |  | // 3.2% that 5 or more groups are invalidated
 | 
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Scores how alike two keys are by comparing them position by position.
							 * Only the indices shared by both strings are inspected. Each index adds
							 * 10 points for identical char codes, one point less for every unit of
							 * char code distance, and nothing once the distance reaches 10.
							 *
							 * @param {string} a key
							 * @param {string} b key
							 * @returns {number} the similarity as number
							 */
							const similarity = (a, b) => {
								const sharedLength = a.length < b.length ? a.length : b.length;
								let score = 0;
								let index = 0;
								while (index < sharedLength) {
									const delta = Math.abs(a.charCodeAt(index) - b.charCodeAt(index));
									// distances of 10 or more contribute nothing
									if (delta < 10) score += 10 - delta;
									index++;
								}
								return score;
							};
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Derives a short name from two keys: the prefix of `a` up to and including
							 * the first character where `a` and `b` differ. When that prefix is already
							 * taken (compared case-insensitively) it is extended one character at a
							 * time. A chosen prefix is recorded in `usedNames` in lower case.
							 *
							 * @param {string} a key
							 * @param {string} b key
							 * @param {Set<string>} usedNames set of already used names
							 * @returns {string} the common part and a single char for the difference
							 */
							const getName = (a, b, usedNames) => {
								const limit = Math.min(a.length, b.length);

								// length of the prefix that ends with the first differing character;
								// stays at `limit` when the shared range is identical
								let prefixLength = limit;
								for (let pos = 0; pos < limit; pos++) {
									if (a.charCodeAt(pos) !== b.charCodeAt(pos)) {
										prefixLength = pos + 1;
										break;
									}
								}

								// grow the prefix until it is not used yet
								for (let end = prefixLength; end < limit; end++) {
									const candidate = a.slice(0, end);
									const normalized = candidate.toLowerCase();
									if (usedNames.has(normalized)) continue;
									usedNames.add(normalized);
									return candidate;
								}

								// names always contain a hash, so this is always unique
								// we don't need to check usedNames nor add it
								return a;
							};
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Adds every entry of `size` onto `total` in place. Size types missing
							 * from `total` start at 0.
							 *
							 * @param {Record<string, number>} total total size
							 * @param {Record<string, number>} size single size
							 * @returns {void}
							 */
							const addSizeTo = (total, size) => {
								Object.keys(size).forEach(type => {
									const current = total[type];
									total[type] = (current ? current : 0) + size[type];
								});
							};
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Accumulates the `size` records of all given nodes into one fresh,
							 * prototype-less object.
							 *
							 * @param {Iterable<Node>} nodes some nodes
							 * @returns {Record<string, number>} total size
							 */
							const sumSize = nodes => {
								const totals = Object.create(null);
								const sizes = Array.from(nodes, entry => entry.size);
								sizes.forEach(size => {
									addSizeTo(totals, size);
								});
								return totals;
							};
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Checks whether any size type exceeds its configured maximum. Size types
							 * without a numeric entry in `maxSize` are ignored.
							 *
							 * @param {Record<string, number>} size size to check
							 * @param {Record<string, number>} maxSize maximum size per size type
							 * @returns {boolean} true, when at least one size type is above its maximum
							 */
							const isTooBig = (size, maxSize) =>
								Object.keys(size).some(type => {
									const limit = maxSize[type];
									return typeof limit === "number" && size[type] > limit;
								});
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Checks whether any size type is below its configured minimum. Size types
							 * without a numeric entry in `minSize` are ignored.
							 *
							 * @param {Record<string, number>} size size to check
							 * @param {Record<string, number>} minSize minimum size per size type
							 * @returns {boolean} true, when at least one size type is below its minimum
							 */
							const isTooSmall = (size, minSize) => {
								const types = Object.keys(size);
								for (let i = 0; i < types.length; i++) {
									const type = types[i];
									const threshold = minSize[type];
									if (typeof threshold !== "number") continue;
									if (size[type] < threshold) return true;
								}
								return false;
							};
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Collects the size types whose value is below the configured minimum.
							 * Size types without a numeric entry in `minSize` are never reported.
							 *
							 * @param {Record<string, number>} size size to check
							 * @param {Record<string, number>} minSize minimum size per size type
							 * @returns {Set<string>} the size types that are too small
							 */
							const getToSmallTypes = (size, minSize) =>
								new Set(
									Object.keys(size).filter(type => {
										const threshold = minSize[type];
										return typeof threshold === "number" && size[type] < threshold;
									})
								);
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Counts how many size types of `size` are contained in `types`.
							 *
							 * @param {Record<string, number>} size size record whose keys are inspected
							 * @param {Set<string>} types size types to look for
							 * @returns {number} number of keys of `size` that are in `types`
							 */
							const getNumberOfMatchingSizeTypes = (size, types) =>
								Object.keys(size).filter(type => types.has(type)).length;
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Sums the values of `size`, restricted to the size types in `types`.
							 *
							 * @param {Record<string, number>} size size record
							 * @param {Set<string>} types size types to include
							 * @returns {number} sum over the selected size types
							 */
							const selectiveSizeSum = (size, types) =>
								Object.keys(size).reduce(
									(acc, type) => (types.has(type) ? acc + size[type] : acc),
									0
								);
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * A single item together with its grouping key and its size per size type.
							 *
							 * @template T
							 */
							class Node {
								/**
								 * @param {T} item item
								 * @param {string} key key
								 * @param {Record<string, number>} size size
								 */
								constructor(item, key, size) {
									// properties are created in the order item, key, size
									Object.assign(this, { item, key, size });
								}
							}
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * An ordered list of nodes plus the similarity between each pair of
							 * neighbours and the summed size of all nodes.
							 *
							 * @template T
							 */
							class Group {
								/**
								 * @param {Node<T>[]} nodes nodes
								 * @param {number[]} similarities similarities between the nodes (length = nodes.length - 1)
								 * @param {Record<string, number>=} size size of the group
								 */
								constructor(nodes, similarities, size) {
									this.nodes = nodes;
									this.similarities = similarities;
									// compute the size from the nodes unless the caller supplied one
									this.size = size ? size : sumSize(nodes);
									/** @type {string} */
									this.key = undefined;
								}

								/**
								 * Removes all nodes accepted by `filter` from this group. The remaining
								 * nodes keep their order; similarities and size are rebuilt for them.
								 *
								 * @param {function(Node): boolean} filter filter function
								 * @returns {Node[]} removed nodes
								 */
								popNodes(filter) {
									const kept = [];
									const keptSimilarities = [];
									const removed = [];
									let previousKept;
									for (let index = 0; index < this.nodes.length; index++) {
										const current = this.nodes[index];
										if (filter(current)) {
											removed.push(current);
											continue;
										}
										if (kept.length > 0) {
											// reuse the stored similarity when both nodes were neighbours
											// before, otherwise compute it for the new pair
											const wereNeighbours = previousKept === this.nodes[index - 1];
											keptSimilarities.push(
												wereNeighbours
													? this.similarities[index - 1]
													: similarity(previousKept.key, current.key)
											);
										}
										kept.push(current);
										previousKept = current;
									}
									this.nodes = kept;
									this.similarities = keptSimilarities;
									this.size = sumSize(kept);
									return removed;
								}
							}
					
						
							|  |  |  | 
 | 
					
						
							/**
							 * Computes the similarity of every pair of neighbouring nodes, in
							 * iteration order. The result has one entry less than there are nodes.
							 *
							 * @param {Iterable<Node>} nodes nodes
							 * @returns {number[]} similarities
							 */
							const getSimilarities = nodes => {
								const ordered = Array.from(nodes);
								/** @type {number[]} */
								const scores = [];
								for (let i = 1; i < ordered.length; i++) {
									const previous = ordered[i - 1];
									if (previous === undefined) continue;
									scores.push(similarity(previous.key, ordered[i].key));
								}
								return scores;
							};
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | /** | 
					
						
							|  |  |  |  * @template T | 
					
						
							|  |  |  |  * @typedef {Object} GroupedItems<T> | 
					
						
							|  |  |  |  * @property {string} key | 
					
						
							|  |  |  |  * @property {T[]} items | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  |  * @property {Record<string, number>} size | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /** | 
					
						
							|  |  |  |  * @template T | 
					
						
							|  |  |  |  * @typedef {Object} Options | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  |  * @property {Record<string, number>} maxSize maximum size of a group | 
					
						
							|  |  |  |  * @property {Record<string, number>} minSize minimum size of a group (preferred over maximum size) | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  |  * @property {Iterable<T>} items a list of items | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  |  * @property {function(T): Record<string, number>} getSize function to get size of an item | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  |  * @property {function(T): string} getKey function to get the key of an item | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /** | 
					
						
							|  |  |  |  * @template T | 
					
						
							|  |  |  |  * @param {Options<T>} options options object | 
					
						
							|  |  |  |  * @returns {GroupedItems<T>[]} grouped items | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | module.exports = ({ maxSize, minSize, items, getSize, getKey }) => { | 
					
						
							|  |  |  | 	/** @type {Group<T>[]} */ | 
					
						
							|  |  |  | 	const result = []; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	const nodes = Array.from( | 
					
						
							|  |  |  | 		items, | 
					
						
							|  |  |  | 		item => new Node(item, getKey(item), getSize(item)) | 
					
						
							|  |  |  | 	); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	/** @type {Node<T>[]} */ | 
					
						
							|  |  |  | 	const initialNodes = []; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 	// lexically ordering of keys
 | 
					
						
							|  |  |  | 	nodes.sort((a, b) => { | 
					
						
							|  |  |  | 		if (a.key < b.key) return -1; | 
					
						
							|  |  |  | 		if (a.key > b.key) return 1; | 
					
						
							|  |  |  | 		return 0; | 
					
						
							|  |  |  | 	}); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 	// return nodes bigger than maxSize directly as group
 | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 	// But make sure that minSize is not violated
 | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 	for (const node of nodes) { | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 		if (isTooBig(node.size, maxSize) && !isTooSmall(node.size, minSize)) { | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 			result.push(new Group([node], [])); | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			initialNodes.push(node); | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (initialNodes.length > 0) { | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 		const initialGroup = new Group(initialNodes, getSimilarities(initialNodes)); | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 		const problemTypes = getToSmallTypes(initialGroup.size, minSize); | 
					
						
							|  |  |  | 		if (problemTypes.size > 0) { | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 			// We hit an edge case where the working set is already smaller than minSize
 | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 			// We merge problematic nodes with the smallest result node to keep minSize intact
 | 
					
						
							|  |  |  | 			const problemNodes = initialGroup.popNodes( | 
					
						
							|  |  |  | 				n => getNumberOfMatchingSizeTypes(n.size, problemTypes) > 0 | 
					
						
							|  |  |  | 			); | 
					
						
							|  |  |  | 			// Only merge it with result nodes that have the problematic size type
 | 
					
						
							|  |  |  | 			const possibleResultGroups = result.filter( | 
					
						
							|  |  |  | 				n => getNumberOfMatchingSizeTypes(n.size, problemTypes) > 0 | 
					
						
							|  |  |  | 			); | 
					
						
							|  |  |  | 			if (possibleResultGroups.length > 0) { | 
					
						
							|  |  |  | 				const bestGroup = possibleResultGroups.reduce((min, group) => { | 
					
						
							|  |  |  | 					const minMatches = getNumberOfMatchingSizeTypes(min); | 
					
						
							|  |  |  | 					const groupMatches = getNumberOfMatchingSizeTypes(group); | 
					
						
							|  |  |  | 					if (minMatches !== groupMatches) | 
					
						
							|  |  |  | 						return minMatches < groupMatches ? group : min; | 
					
						
							|  |  |  | 					if ( | 
					
						
							|  |  |  | 						selectiveSizeSum(min.size, problemTypes) > | 
					
						
							|  |  |  | 						selectiveSizeSum(group.size, problemTypes) | 
					
						
							|  |  |  | 					) | 
					
						
							|  |  |  | 						return group; | 
					
						
							|  |  |  | 					return min; | 
					
						
							|  |  |  | 				}); | 
					
						
							|  |  |  | 				for (const node of problemNodes) bestGroup.nodes.push(node); | 
					
						
							|  |  |  | 				bestGroup.nodes.sort((a, b) => { | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					if (a.key < b.key) return -1; | 
					
						
							|  |  |  | 					if (a.key > b.key) return 1; | 
					
						
							|  |  |  | 					return 0; | 
					
						
							|  |  |  | 				}); | 
					
						
							|  |  |  | 			} else { | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 				// There are no other nodes with the same size types
 | 
					
						
							|  |  |  | 				// We create a new group and have to accept that it's smaller than minSize
 | 
					
						
							|  |  |  | 				result.push(new Group(problemNodes, null)); | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 			} | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 		} | 
					
						
							|  |  |  | 		if (initialGroup.nodes.length > 0) { | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 			const queue = [initialGroup]; | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 			while (queue.length) { | 
					
						
							|  |  |  | 				const group = queue.pop(); | 
					
						
							|  |  |  | 				// only groups bigger than maxSize need to be splitted
 | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 				if (!isTooBig(group.size, maxSize)) { | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					result.push(group); | 
					
						
							|  |  |  | 					continue; | 
					
						
							|  |  |  | 				} | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 				// find unsplittable area from left and right
 | 
					
						
							|  |  |  | 				// going minSize from left and right
 | 
					
						
							|  |  |  | 				// at least one node need to be included otherwise we get stuck
 | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 				let left = 1; | 
					
						
							|  |  |  | 				let leftSize = Object.create(null); | 
					
						
							|  |  |  | 				addSizeTo(leftSize, group.nodes[0].size); | 
					
						
							|  |  |  | 				while (isTooSmall(leftSize, minSize)) { | 
					
						
							|  |  |  | 					addSizeTo(leftSize, group.nodes[left].size); | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					left++; | 
					
						
							|  |  |  | 				} | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 				let right = group.nodes.length - 2; | 
					
						
							|  |  |  | 				let rightSize = Object.create(null); | 
					
						
							|  |  |  | 				addSizeTo(rightSize, group.nodes[group.nodes.length - 1].size); | 
					
						
							|  |  |  | 				while (isTooSmall(rightSize, minSize)) { | 
					
						
							|  |  |  | 					addSizeTo(rightSize, group.nodes[right].size); | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					right--; | 
					
						
							|  |  |  | 				} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 				if (left - 1 > right) { | 
					
						
							|  |  |  | 					// can't split group while holding minSize
 | 
					
						
							|  |  |  | 					// because minSize is preferred of maxSize we return
 | 
					
						
							| 
									
										
										
										
											2018-12-04 23:40:06 +08:00
										 |  |  | 					// the problematic nodes as result here even while it's too big
 | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					// To avoid this make sure maxSize > minSize * 3
 | 
					
						
							|  |  |  | 					result.push(group); | 
					
						
							|  |  |  | 					continue; | 
					
						
							|  |  |  | 				} | 
					
						
							|  |  |  | 				if (left <= right) { | 
					
						
							|  |  |  | 					// when there is a area between left and right
 | 
					
						
							|  |  |  | 					// we look for best split point
 | 
					
						
							|  |  |  | 					// we split at the minimum similarity
 | 
					
						
							|  |  |  | 					// here key space is separated the most
 | 
					
						
							|  |  |  | 					let best = left - 1; | 
					
						
							|  |  |  | 					let bestSimilarity = group.similarities[best]; | 
					
						
							|  |  |  | 					for (let i = left; i <= right; i++) { | 
					
						
							|  |  |  | 						const similarity = group.similarities[i]; | 
					
						
							|  |  |  | 						if (similarity < bestSimilarity) { | 
					
						
							|  |  |  | 							best = i; | 
					
						
							|  |  |  | 							bestSimilarity = similarity; | 
					
						
							|  |  |  | 						} | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 					} | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					left = best + 1; | 
					
						
							|  |  |  | 					right = best; | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 				} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 				// create two new groups for left and right area
 | 
					
						
							|  |  |  | 				// and queue them up
 | 
					
						
							|  |  |  | 				const rightNodes = [group.nodes[right + 1]]; | 
					
						
							|  |  |  | 				/** @type {number[]} */ | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 				const rightSimilarities = []; | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 				for (let i = right + 2; i < group.nodes.length; i++) { | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 					rightSimilarities.push(group.similarities[i - 1]); | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					rightNodes.push(group.nodes[i]); | 
					
						
							|  |  |  | 				} | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 				queue.push(new Group(rightNodes, rightSimilarities)); | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 				const leftNodes = [group.nodes[0]]; | 
					
						
							|  |  |  | 				/** @type {number[]} */ | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 				const leftSimilarities = []; | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 				for (let i = 1; i < left; i++) { | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 					leftSimilarities.push(group.similarities[i - 1]); | 
					
						
							| 
									
										
										
										
											2018-11-24 16:17:16 +08:00
										 |  |  | 					leftNodes.push(group.nodes[i]); | 
					
						
							|  |  |  | 				} | 
					
						
							| 
									
										
										
										
											2020-03-13 00:51:26 +08:00
										 |  |  | 				queue.push(new Group(leftNodes, leftSimilarities)); | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 			} | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	// lexically ordering
 | 
					
						
							|  |  |  | 	result.sort((a, b) => { | 
					
						
							|  |  |  | 		if (a.nodes[0].key < b.nodes[0].key) return -1; | 
					
						
							|  |  |  | 		if (a.nodes[0].key > b.nodes[0].key) return 1; | 
					
						
							|  |  |  | 		return 0; | 
					
						
							|  |  |  | 	}); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	// give every group a name
 | 
					
						
							| 
									
										
										
										
											2020-06-16 23:28:53 +08:00
										 |  |  | 	const usedNames = new Set(); | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 	for (let i = 0; i < result.length; i++) { | 
					
						
							|  |  |  | 		const group = result[i]; | 
					
						
							| 
									
										
										
										
											2020-06-16 23:28:53 +08:00
										 |  |  | 		if (group.nodes.length === 1) { | 
					
						
							|  |  |  | 			group.key = group.nodes[0].key; | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			const first = group.nodes[0]; | 
					
						
							|  |  |  | 			const last = group.nodes[group.nodes.length - 1]; | 
					
						
							|  |  |  | 			const name = getName(first.key, last.key, usedNames); | 
					
						
							|  |  |  | 			group.key = name; | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2018-07-04 15:59:22 +08:00
										 |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	// return the results
 | 
					
						
							|  |  |  | 	return result.map(group => { | 
					
						
							|  |  |  | 		/** @type {GroupedItems} */ | 
					
						
							|  |  |  | 		return { | 
					
						
							|  |  |  | 			key: group.key, | 
					
						
							|  |  |  | 			items: group.nodes.map(node => node.item), | 
					
						
							|  |  |  | 			size: group.size | 
					
						
							|  |  |  | 		}; | 
					
						
							|  |  |  | 	}); | 
					
						
							|  |  |  | }; |