lithium\util\Set

class

Used for complex manipulation, comparison, and access of array data. Some methods allow for XPath-like data access, as follows:

  • '/User/id': Similar to the classic {n}.User.id.
  • '/User[2]/name': Selects the name of the second User.
  • '/User[id>2]': Selects all Users with an id > 2.
  • '/User[id>2][<5]': Selects all Users with an id > 2 but < 5.
  • '/Post/Comment[author_name=John]/../name': Selects the name of all posts that have at least one comment written by John.
  • '/Posts[name]': Selects all Posts that have a 'name' key.
  • '/Comment/.[1]': Selects the contents of the first comment.
  • '/Comment/.[:last]': Selects the last comment.
  • '/Comment/.[:first]': Selects the first comment.
  • '/Comment[text=/lithium/i]': Selects the all comments that have a text matching the regex /lithium/i.
  • '/Comment/@*': Selects all key names of all comments.

Source

class Set {

	/**
	 * Add the keys/values in `$array2` that are not found in `$array` onto the end of `$array`.
	 *
	 * @param mixed $array Original array.
	 * @param mixed $array2 Second array to add onto the original.
	 * @return array An array containing all the keys of the second array not already present in the
	 *         first.
	 */
	public static function append(array $array, array $array2) {
		$arrays = func_get_args();
		$array = array_shift($arrays);
		foreach ($arrays as $array2) {
			if (!$array && $array2) {
				$array = $array2;
				continue;
			}
			foreach ($array2 as $key => $value) {
				if (!array_key_exists($key, $array)) {
					$array[$key] = $value;
				} elseif (is_array($value)) {
					$array[$key] = static::append($array[$key], $array2[$key]);
				}
			}
		}
		return $array;
	}

	/**
	 * Checks if a particular path is set in an array. Tests by key name, or dot-delimited key
	 * name, i.e.:
	 *
	 * ``` embed:lithium\tests\cases\util\SetTest::testCheck(1-4) ```
	 *
	 * @param mixed $data Data to check on.
	 * @param mixed $path A dot-delimited string.
	 * @return boolean `true` if path is found, `false` otherwise.
	 */
	public static function check($data, $path = null) {
		if (!$path) {
			return $data;
		}
		$path = is_array($path) ? $path : explode('.', $path);

		foreach ($path as $i => $key) {
			if (is_numeric($key) && (integer) $key > 0 || $key === '0') {
				$key = (integer) $key;
			}
			if ($i === count($path) - 1) {
				return (is_array($data) && isset($data[$key]));
			} else {
				if (!is_array($data) || !isset($data[$key])) {
					return false;
				}
				$data =& $data[$key];
			}
		}
	}

	/**
	 * Creates an associative array using a `$path1` as the path to build its keys, and optionally
	 * `$path2` as path to get the values. If `$path2` is not specified, all values will be
	 * initialized to `null` (useful for `Set::merge()`). You can optionally group the values by
	 * what is obtained when following the path specified in `$groupPath`.
	 *
	 * @param array $data Array from where to extract keys and values.
	 * @param mixed $path1 As an array, or as a dot-delimited string.
	 * @param mixed $path2 As an array, or as a dot-delimited string.
	 * @param string $groupPath As an array, or as a dot-delimited string.
	 * @return array Combined array.
	 */
	public static function combine($data, $path1 = null, $path2 = null, $groupPath = null) {
		if (!$data) {
			return [];
		}
		if (is_object($data)) {
			$data = get_object_vars($data);
		}
		if (is_array($path1)) {
			$format = array_shift($path1);
			$keys = static::format($data, $format, $path1);
		} else {
			$keys = static::extract($data, $path1);
		}
		$vals = [];
		if (!empty($path2) && is_array($path2)) {
			$format = array_shift($path2);
			$vals = static::format($data, $format, $path2);
		} elseif (!empty($path2)) {
			$vals = static::extract($data, $path2);
		}
		$valCount = count($vals);
		$count = count($keys);

		for ($i = $valCount; $i < $count; $i++) {
			$vals[$i] = null;
		}
		if ($groupPath) {
			$group = static::extract($data, $groupPath);
			if (!empty($group)) {
				$c = count($keys);
				for ($i = 0; $i < $c; $i++) {
					if (!isset($group[$i])) {
						$group[$i] = 0;
					}
					if (!isset($out[$group[$i]])) {
						$out[$group[$i]] = [];
					}
					$out[$group[$i]][$keys[$i]] = $vals[$i];
				}
				return $out;
			}
		}
		return array_combine($keys, $vals);
	}

	/**
	 * Determines if the array elements in `$array2` are wholly contained within `$array1`. Works
	 * recursively.
	 *
	 * @param array $array1 First value.
	 * @param array $array2 Second value.
	 * @return boolean Returns `true` if `$array1` wholly contains the keys and values of `$array2`,
	 *         otherwise, returns `false`. Returns `false` if either array is empty.
	 */
	public static function contains(array $array1, array $array2) {
		if (!$array1 || !$array2) {
			return false;
		}
		foreach ($array2 as $key => $val) {
			if (!isset($array1[$key]) || $array1[$key] !== $val) {
				return false;
			}
			if (is_array($val) && !static::contains($array1[$key], $val)) {
				return false;
			}
		}
		return true;
	}

	/**
	 * Counts the dimensions of an array. If `$all` is set to `false` (which is the default) it will
	 * only consider the dimension of the first element in the array.
	 *
	 * @param array $data Array to count dimensions on.
	 * @param array $options
	 * @return integer The number of dimensions in `$array`.
	 */
	public static function depth($data, array $options = []) {
		$defaults = ['all' => false, 'count' => 0];
		$options += $defaults;

		if (!$data) {
			return 0;
		}

		if (!$options['all']) {
			return (is_array(reset($data))) ? static::depth(reset($data)) + 1 : 1;
		}
		$depth = [$options['count']];

		if (is_array($data) && reset($data) !== false) {
			foreach ($data as $value) {
				$depth[] = static::depth($value, [
					'all' => $options['all'],
					'count' => $options['count'] + 1
				]);
			}
		}
		return max($depth);
	}

	/**
	 * Computes the difference between two arrays.
	 *
	 * @param array $val1 First value.
	 * @param array $val2 Second value.
	 * @return array Computed difference.
	 */
	public static function diff(array $val1, array $val2) {
		if (!$val1 || !$val2) {
			return $val2 ?: $val1;
		}
		$out = [];

		foreach ($val1 as $key => $val) {
			$exists = isset($val2[$key]);

			if (($exists && $val2[$key] !== $val) || !$exists) {
				$out[$key] = $val;
			}
			unset($val2[$key]);
		}

		foreach ($val2 as $key => $val) {
			if (!isset($out[$key])) {
				$out[$key] = $val;
			}
		}
		return $out;
	}

	/**
	 * Implements partial support for XPath 2.0.
	 *
	 * @param array $data An array of data to extract from.
	 * @param string $path An absolute XPath 2.0 path. Only absolute paths starting with a
	 *        single slash are supported right now. Implemented selectors:
	 *        - `'/User/id'`: Similar to the classic {n}.User.id.
	 *        - `'/User[2]/name'`: Selects the name of the second User.
	 *        - `'/User[id>2]'`: Selects all Users with an id > 2.
	 *        - `'/User[id>2][<5]'`: Selects all Users with an id > 2 but < 5.
	 *        - `'/Post/Comment[author_name=John]/../name'`: Selects the name of
	 *          all posts that have at least one comment written by John.
	 *        - `'/Posts[name]'`: Selects all Posts that have a `'name'` key.
	 *        - `'/Comment/.[1]'`: Selects the contents of the first comment.
	 *        - `'/Comment/.[:last]'`: Selects the last comment.
	 *        - `'/Comment/.[:first]'`: Selects the first comment.
	 *        - `'/Comment[text=/lithium/i]`': Selects the all comments that have
	 *          a text matching the regex `/lithium/i`.
	 *        - `'/Comment/@*'`: Selects all key names of all comments.
	 * @param array $options Currently only supports `'flatten'` which can be
	 *              disabled for higher XPath-ness.
	 * @return array An array of matched items.
	 */
	public static function extract(array $data, $path = null, array $options = []) {
		$defaults = ['flatten' => true];
		$options += $defaults;

		if (!$data) {
			return [];
		}
		if ($path === '/') {
			return array_filter($data, function($data) {
				return ($data === 0 || $data === '0' || !empty($data));
			});
		}
		$contexts = $data;

		if (!isset($contexts[0])) {
			$contexts = [$data];
		}

		$tokens = array_slice(preg_split('/(?<!=)\/(?![a-z-]*\])/', $path), 1);

		do {
			$token = array_shift($tokens);
			$conditions = false;

			if (preg_match_all('/\[([^=]+=\/[^\/]+\/|[^\]]+)\]/', $token, $m)) {
				$conditions = $m[1];
				$token = substr($token, 0, strpos($token, '['));
			}
			$matches = [];

			foreach ($contexts as $key => $context) {
				if (!isset($context['trace'])) {
					$context = ['trace' => [null], 'item' => $context, 'key' => $key];
				}
				if ($token === '..') {
					if (count($context['trace']) === 1) {
						$context['trace'][] = $context['key'];
					}

					array_pop($context['trace']);
					$parent = join('/', $context['trace']);
					$context['item'] = static::extract($data, $parent);
					array_pop($context['trace']);
					$context['item'] = array_shift($context['item']);
					$matches[] = $context;
					continue;
				}
				$match = false;

				if ($token === '@*' && is_array($context['item'])) {
					$matches[] = [
						'trace' => array_merge($context['trace'], (array) $key),
						'key' => $key,
						'item' => array_keys($context['item'])
					];
				} elseif (is_array($context['item']) && isset($context['item'][$token])) {
					$items = $context['item'][$token];
					if (!is_array($items)) {
						$items = [$items];
					} elseif (!isset($items[0])) {
						$current = current($items);
						if ((is_array($current) && count($items) <= 1) || !is_array($current)) {
							$items = [$items];
						}
					}

					foreach ($items as $key => $item) {
						$ctext = [$context['key']];
						if (!is_numeric($key)) {
							$ctext[] = $token;
							$token = array_shift($tokens);
							if (isset($items[$token])) {
								$ctext[] = $token;
								$item = $items[$token];
								$matches[] = [
									'trace' => array_merge($context['trace'], $ctext),
									'key' => $key,
									'item' => $item
								];
								break;
							} else {
								array_unshift($tokens, $token);
							}
						} else {
							$ctext[] = $token;
						}

						$matches[] = [
							'trace' => array_merge($context['trace'], $ctext),
							'key' => $key,
							'item' => $item
						];
					}
				} elseif (
					$key === $token || (is_numeric($token) && $key == $token) || $token === '.'
				) {
					$context['trace'][] = $key;
					$matches[] = [
						'trace' => $context['trace'],
						'key' => $key,
						'item' => $context['item']
					];
				}
			}
			if ($conditions) {
				foreach ($conditions as $condition) {
					$filtered = [];
					$length = count($matches);

					foreach ($matches as $i => $match) {
						if (static::matches($match['item'], [$condition], $i + 1, $length)) {
							$filtered[] = $match;
						}
					}
					$matches = $filtered;
				}
			}
			$contexts = $matches;

			if (empty($tokens)) {
				break;
			}
		} while (true);

		$r = [];

		foreach ($matches as $match) {
			$key = array_pop($match['trace']);
			$condition = (!is_int($key) && $key !== null);
			if ((!$options['flatten'] || is_array($match['item'])) && $condition) {
				$r[] = [$key => $match['item']];
			} else {
				$r[] = $match['item'];
			}
		}
		return $r;
	}

	/**
	 * Collapses a multi-dimensional array into a single dimension, using a delimited array path
	 * for each array element's key, i.e. [array('Foo' => ['Bar' => 'Far'])] becomes
	 * ['0.Foo.Bar' => 'Far'].
	 *
	 * @param array $data array to flatten
	 * @param array $options Available options are:
	 *        - `'separator'`: String to separate array keys in path (defaults to `'.'`).
	 *        - `'path'`: Starting point (defaults to null).
	 * @return array
	 */
	public static function flatten($data, array $options = []) {
		$defaults = ['separator' => '.', 'path' => null];
		$options += $defaults;
		$result = [];

		if ($options['path'] !== null) {
			$options['path'] .= $options['separator'];
		}
		foreach ($data as $key => $val) {
			if (!is_array($val)) {
				$result[$options['path'] . $key] = $val;
				continue;
			}
			$opts = ['separator' => $options['separator'], 'path' => $options['path'] . $key];
			$result += (array) static::flatten($val, $opts);
		}
		return $result;
	}

	/**
	 * Accepts a one-dimensional array where the keys are separated by a delimiter.
	 *
	 * @param array $data The one-dimensional array to expand.
	 * @param array $options The options used when expanding the array:
	 *        - `'separator'` _string_: The delimiter to use when separating keys. Defaults
	 *          to `'.'`.
	 * @return array Returns a multi-dimensional array expanded from a one dimensional
	 *         dot-separated array.
	 */
	public static function expand(array $data, array $options = []) {
		$defaults = ['separator' => '.'];
		$options += $defaults;
		$result = [];

		foreach ($data as $key => $val) {
			if (strpos($key, $options['separator']) === false) {
				if (!isset($result[$key])) {
					$result[$key] = $val;
				}
				continue;
			}
			list($path, $key) = explode($options['separator'], $key, 2);
			$path = is_numeric($path) ? (integer) $path : $path;
			$result[$path][$key] = $val;
		}
		foreach ($result as $key => $value) {
			if (is_array($value)) {
				$result[$key] = static::expand($value, $options);
			}
		}
		return $result;
	}

	/**
	 * Returns a series of values extracted from an array, formatted in a format string.
	 *
	 * @param array $data Source array from which to extract the data.
	 * @param string $format Format string into which values will be inserted using `sprintf()`.
	 * @param array $keys An array containing one or more `Set::extract()`-style key paths.
	 * @return array An array of strings extracted from `$keys` and formatted with `$format`.
	 * @link http://php.net/sprintf
	 */
	public static function format($data, $format, $keys) {
		$extracted = [];
		$count = count($keys);

		if (!$count) {
			return;
		}
		for ($i = 0; $i < $count; $i++) {
			$extracted[] = static::extract($data, $keys[$i]);
		}
		$out = [];
		$data = $extracted;
		$count = count($data[0]);

		if (preg_match_all('/\{([0-9]+)\}/msi', $format, $keys2) && isset($keys2[1])) {
			$keys = $keys2[1];
			$format = preg_split('/\{([0-9]+)\}/msi', $format);
			$count2 = count($format);

			for ($j = 0; $j < $count; $j++) {
				$formatted = '';
				for ($i = 0; $i <= $count2; $i++) {
					if (isset($format[$i])) {
						$formatted .= $format[$i];
					}
					if (isset($keys[$i]) && isset($data[$keys[$i]][$j])) {
						$formatted .= $data[$keys[$i]][$j];
					}
				}
				$out[] = $formatted;
			}
			return $out;
		}
		$count2 = count($data);

		for ($j = 0; $j < $count; $j++) {
			$args = [];

			for ($i = 0; $i < $count2; $i++) {
				if (isset($data[$i][$j])) {
					$args[] = $data[$i][$j];
				}
			}
			$out[] = vsprintf($format, $args);
		}
		return $out;
	}

	/**
	 * Inserts `$data` into an array as defined by `$path`.
	 *
	 * @param mixed $list Where to insert into.
	 * @param mixed $path A dot-delimited string.
	 * @param array $data Data to insert.
	 * @return array
	 */
	public static function insert($list, $path, $data = []) {
		if (!is_array($path)) {
			$path = explode('.', $path);
		}
		$_list =& $list;

		foreach ($path as $i => $key) {
			if (is_numeric($key) && (integer) $key > 0 || $key === '0') {
				$key = (integer) $key;
			}
			if ($i === count($path) - 1) {
				$_list[$key] = $data;
			} else {
				if (!isset($_list[$key])) {
					$_list[$key] = [];
				}
				$_list =& $_list[$key];
			}
		}
		return $list;
	}

	/**
	 * Checks to see if all the values in the array are numeric.
	 *
	 * @param array $array The array to check.  If null, the value of the current Set object.
	 * @return mixed `true` if values are numeric, `false` if not and `null` if the array to
	 *               check is empty.
	 */
	public static function isNumeric($array = null) {
		if (empty($array)) {
			return null;
		}
		if ($array === range(0, count($array) - 1)) {
			return true;
		}
		$numeric = true;
		$keys = array_keys($array);
		$count = count($keys);

		for ($i = 0; $i < $count; $i++) {
			if (!is_numeric($array[$keys[$i]])) {
				$numeric = false;
				break;
			}
		}
		return $numeric;
	}

	/**
	 * This function can be used to see if a single item or a given XPath
	 * match certain conditions.
	 *
	 * @param array $data An array of data to execute the match on.
	 * @param mixed $conditions An array of condition strings or an XPath expression.
	 * @param integer $i Optional: The 'nth'-number of the item being matched.
	 * @param integer $length
	 * @return boolean
	 */
	public static function matches($data, $conditions, $i = null, $length = null) {
		if (!$conditions) {
			return true;
		}
		if (is_string($conditions)) {
			return (boolean) static::extract($data, $conditions);
		}
		foreach ($conditions as $condition) {
			if ($condition === ':last') {
				if ($i !== $length) {
					return false;
				}
				continue;
			} elseif ($condition === ':first') {
				if ($i !== 1) {
					return false;
				}
				continue;
			}
			if (!preg_match('/(.+?)([><!]?[=]|[><])(.*)/', $condition, $match)) {
				if (ctype_digit($condition)) {
					if ($i !== (int) $condition) {
						return false;
					}
				} elseif (preg_match_all('/(?:^[0-9]+|(?<=,)[0-9]+)/', $condition, $matches)) {
					return in_array($i, $matches[0]);
				} elseif (!isset($data[$condition])) {
					return false;
				}
				continue;
			}
			list(,$key,$op,$expected) = $match;

			if (!isset($data[$key])) {
				return false;
			}
			$val = $data[$key];

			if ($op === '=' && $expected && $expected[0] === '/') {
				return preg_match($expected, $val);
			} elseif ($op === '=' && $val != $expected) {
				return false;
			} elseif ($op === '!=' && $val == $expected) {
				return false;
			} elseif ($op === '>' && $val <= $expected) {
				return false;
			} elseif ($op === '<' && $val >= $expected) {
				return false;
			} elseif ($op === '<=' && $val > $expected) {
				return false;
			} elseif ($op === '>=' && $val < $expected) {
				return false;
			}
		}
		return true;
	}

	/**
	 * This method can be thought of as a hybrid between PHP's `array_merge()`
	 * and `array_merge_recursive()`.  The difference to the two is that if an
	 * array key contains another array then the function behaves recursive
	 * (unlike `array_merge()`) but does not do if for keys containing strings
	 * (unlike `array_merge_recursive()`).  Please note: This function will work
	 * with an unlimited amount of arguments and typecasts non-array parameters
	 * into arrays.
	 *
	 * @param array $array1 The base array.
	 * @param array $array2 The array to be merged on top of the base array.
	 * @return array Merged array of all passed params.
	 */
	public static function merge(array $array1, array $array2) {
		$args = [$array1, $array2];

		if (!$array1 || !$array2) {
			return $array1 ?: $array2;
		}
		$result = (array) current($args);

		while (($arg = next($args)) !== false) {
			foreach ((array) $arg as $key => $val) {
				if (is_array($val) && isset($result[$key]) && is_array($result[$key])) {
					$result[$key] = static::merge($result[$key], $val);
				} elseif (is_int($key)) {
					$result[] = $val;
				} else {
					$result[$key] = $val;
				}
			}
		}
		return $result;
	}

	/**
	 * Normalizes a string or array list.
	 *
	 * ```
	 * Set::normalize('foo,bar'); // returns ['foo' => null, 'bar' => null];
	 * Set::normalize(['foo', 'bar' => 'baz']; // returns ['foo' => null, 'bar' => 'baz'];
	 * ```
	 *
	 * @param string|array $list List to normalize.
	 * @param boolean $assoc If `true`, `$list` will be converted to an associative array.
	 * @param string $sep If `$list` is a string, it will be split into an array with `$sep`.
	 * @param boolean $trim If `true`, separated strings will be trimmed.
	 * @return array
	 */
	public static function normalize($list, $assoc = true, $sep = ',', $trim = true) {
		if (is_string($list)) {
			$list = explode($sep, $list);
			$list = ($trim) ? array_map('trim', $list) : $list;
			return ($assoc) ? static::normalize($list) : $list;
		}

		if (!is_array($list)) {
			return $list;
		}

		$keys = array_keys($list);
		$count = count($keys);
		$numeric = true;

		if (!$assoc) {
			for ($i = 0; $i < $count; $i++) {
				if (!is_int($keys[$i])) {
					$numeric = false;
					break;
				}
			}
		}

		if (!$numeric || $assoc) {
			$newList = [];
			for ($i = 0; $i < $count; $i++) {
				if (is_int($keys[$i]) && is_scalar($list[$keys[$i]])) {
					$newList[$list[$keys[$i]]] = null;
				} else {
					$newList[$keys[$i]] = $list[$keys[$i]];
				}
			}
			$list = $newList;
		}
		return $list;
	}

	/**
	 * Removes an element from an array as defined by `$path`.
	 *
	 * @param mixed $list From where to remove.
	 * @param mixed $path A dot-delimited string.
	 * @return array Array with `$path` removed from its value.
	 */
	public static function remove($list, $path = null) {
		if (empty($path)) {
			return $list;
		}
		if (!is_array($path)) {
			$path = explode('.', $path);
		}
		$_list =& $list;

		foreach ($path as $i => $key) {
			if (is_numeric($key) && (integer) $key > 0 || $key === '0') {
				$key = (integer) $key;
			}
			if ($i === count($path) - 1) {
				unset($_list[$key]);
			} else {
				if (!isset($_list[$key])) {
					return $list;
				}
				$_list =& $_list[$key];
			}
		}
		return $list;
	}

	/**
	 * Sorts an array by any value, determined by a `Set`-compatible path.
	 *
	 * @param array $data
	 * @param string $path A `Set`-compatible path to the array value.
	 * @param string $dir Either `'asc'` (the default) or `'desc'`.
	 * @return array
	 */
	public static function sort($data, $path, $dir = 'asc') {
		$flatten = function($flatten, $results, $key = null) {
			$stack = [];
			foreach ((array) $results as $k => $r) {
				$id = $k;
				if ($key !== null) {
					$id = $key;
				}
				if (is_array($r)) {
					$stack = array_merge($stack, $flatten($flatten, $r, $id));
				} else {
					$stack[] = ['id' => $id, 'value' => $r];
				}
			}
			return $stack;
		};
		$extract = static::extract($data, $path);
		$result = $flatten($flatten, $extract);

		$keys = static::extract($result, '/id');
		$values = static::extract($result, '/value');

		$dir = ($dir === 'desc') ? SORT_DESC : SORT_ASC;
		array_multisort($values, $dir, $keys, $dir);
		$sorted = [];
		$keys = array_unique($keys);

		foreach ($keys as $k) {
			$sorted[] = $data[$k];
		}
		return $sorted;
	}

	/**
	 * Slices an array into two, separating them determined by an array of keys.
	 *
	 * Usage examples:
	 *
	 * ``` embed:lithium\tests\cases\util\SetTest::testSetSlice(1-4) ```
	 *
	 * @param array $subject Array that gets split apart
	 * @param array|string $keys An array of keys or a single key as string
	 * @return array An array containing both arrays, having the array with requested keys first and
	 *         the remainder as second element
	 */
	public static function slice(array $data, $keys) {
		$removed = array_intersect_key($data, array_fill_keys((array) $keys, true));
		$data = array_diff_key($data, $removed);
		return [$data, $removed];
	}

}