Search moodle.org's
Developer Documentation

See Release Notes

  • Bug fixes for general core bugs in 3.10.x will end 8 November 2021 (12 months).
  • Bug fixes for security issues in 3.10.x will end 9 May 2022 (18 months).
  • PHP version: minimum PHP 7.2.0 Note: minimum PHP version has increased since Moodle 3.8. PHP 7.3.x and 7.4.x are supported too.

Differences Between: [Versions 310 and 400] [Versions 310 and 401] [Versions 310 and 402] [Versions 310 and 403]

   1  <?php
   2  
   3  declare(strict_types=1);
   4  
   5  namespace Phpml\Clustering\KMeans;
   6  
   7  use InvalidArgumentException;
   8  use LogicException;
   9  use Phpml\Clustering\KMeans;
  10  use SplObjectStorage;
  11  
  12  class Space extends SplObjectStorage
  13  {
  14      /**
  15       * @var int
  16       */
  17      protected $dimension;
  18  
  19      public function __construct(int $dimension)
  20      {
  21          if ($dimension < 1) {
  22              throw new LogicException('a space dimension cannot be null or negative');
  23          }
  24  
  25          $this->dimension = $dimension;
  26      }
  27  
  28      public function toArray(): array
  29      {
  30          $points = [];
  31  
  32          /** @var Point $point */
  33          foreach ($this as $point) {
  34              $points[] = $point->toArray();
  35          }
  36  
  37          return ['points' => $points];
  38      }
  39  
  40      /**
  41       * @param mixed $label
  42       */
  43      public function newPoint(array $coordinates, $label = null): Point
  44      {
  45          if (count($coordinates) !== $this->dimension) {
  46              throw new LogicException('('.implode(',', $coordinates).') is not a point of this space');
  47          }
  48  
  49          return new Point($coordinates, $label);
  50      }
  51  
  52      /**
  53       * @param mixed $label
  54       * @param mixed $data
  55       */
  56      public function addPoint(array $coordinates, $label = null, $data = null): void
  57      {
  58          $this->attach($this->newPoint($coordinates, $label), $data);
  59      }
  60  
  61      /**
  62       * @param object $point
  63       * @param mixed  $data
  64       */
  65      public function attach($point, $data = null): void
  66      {
  67          if (!$point instanceof Point) {
  68              throw new InvalidArgumentException('can only attach points to spaces');
  69          }
  70  
  71          parent::attach($point, $data);
  72      }
  73  
  74      public function getDimension(): int
  75      {
  76          return $this->dimension;
  77      }
  78  
  79      /**
  80       * @return array|bool
  81       */
  82      public function getBoundaries()
  83      {
  84          if (count($this) === 0) {
  85              return false;
  86          }
  87  
  88          $min = $this->newPoint(array_fill(0, $this->dimension, null));
  89          $max = $this->newPoint(array_fill(0, $this->dimension, null));
  90  
  91          /** @var self $point */
  92          foreach ($this as $point) {
  93              for ($n = 0; $n < $this->dimension; ++$n) {
  94                  if ($min[$n] === null || $min[$n] > $point[$n]) {
  95                      $min[$n] = $point[$n];
  96                  }
  97  
  98                  if ($max[$n] === null || $max[$n] < $point[$n]) {
  99                      $max[$n] = $point[$n];
 100                  }
 101              }
 102          }
 103  
 104          return [$min, $max];
 105      }
 106  
 107      public function getRandomPoint(Point $min, Point $max): Point
 108      {
 109          $point = $this->newPoint(array_fill(0, $this->dimension, null));
 110  
 111          for ($n = 0; $n < $this->dimension; ++$n) {
 112              $point[$n] = random_int($min[$n], $max[$n]);
 113          }
 114  
 115          return $point;
 116      }
 117  
 118      /**
 119       * @return Cluster[]
 120       */
 121      public function cluster(int $clustersNumber, int $initMethod = KMeans::INIT_RANDOM): array
 122      {
 123          $clusters = $this->initializeClusters($clustersNumber, $initMethod);
 124  
 125          do {
 126          } while (!$this->iterate($clusters));
 127  
 128          return $clusters;
 129      }
 130  
 131      /**
 132       * @return Cluster[]
 133       */
 134      protected function initializeClusters(int $clustersNumber, int $initMethod): array
 135      {
 136          switch ($initMethod) {
 137              case KMeans::INIT_RANDOM:
 138                  $clusters = $this->initializeRandomClusters($clustersNumber);
 139  
 140                  break;
 141  
 142              case KMeans::INIT_KMEANS_PLUS_PLUS:
 143                  $clusters = $this->initializeKMPPClusters($clustersNumber);
 144  
 145                  break;
 146  
 147              default:
 148                  return [];
 149          }
 150  
 151          $clusters[0]->attachAll($this);
 152  
 153          return $clusters;
 154      }
 155  
 156      /**
 157       * @param Cluster[] $clusters
 158       */
 159      protected function iterate(array $clusters): bool
 160      {
 161          $convergence = true;
 162  
 163          $attach = new SplObjectStorage();
 164          $detach = new SplObjectStorage();
 165  
 166          foreach ($clusters as $cluster) {
 167              foreach ($cluster as $point) {
 168                  $closest = $point->getClosest($clusters);
 169  
 170                  if ($closest !== $cluster) {
 171                      $attach[$closest] ?? $attach[$closest] = new SplObjectStorage();
 172                      $detach[$cluster] ?? $detach[$cluster] = new SplObjectStorage();
 173  
 174                      $attach[$closest]->attach($point);
 175                      $detach[$cluster]->attach($point);
 176  
 177                      $convergence = false;
 178                  }
 179              }
 180          }
 181  
 182          /** @var Cluster $cluster */
 183          foreach ($attach as $cluster) {
 184              $cluster->attachAll($attach[$cluster]);
 185          }
 186  
 187          /** @var Cluster $cluster */
 188          foreach ($detach as $cluster) {
 189              $cluster->detachAll($detach[$cluster]);
 190          }
 191  
 192          foreach ($clusters as $cluster) {
 193              $cluster->updateCentroid();
 194          }
 195  
 196          return $convergence;
 197      }
 198  
 199      /**
 200       * @return Cluster[]
 201       */
 202      protected function initializeKMPPClusters(int $clustersNumber): array
 203      {
 204          $clusters = [];
 205          $this->rewind();
 206  
 207          /** @var Point $current */
 208          $current = $this->current();
 209  
 210          $clusters[] = new Cluster($this, $current->getCoordinates());
 211  
 212          $distances = new SplObjectStorage();
 213  
 214          for ($i = 1; $i < $clustersNumber; ++$i) {
 215              $sum = 0;
 216              /** @var Point $point */
 217              foreach ($this as $point) {
 218                  $closest = $point->getClosest($clusters);
 219                  if ($closest === null) {
 220                      continue;
 221                  }
 222  
 223                  $distance = $point->getDistanceWith($closest);
 224                  $sum += $distances[$point] = $distance;
 225              }
 226  
 227              $sum = random_int(0, (int) $sum);
 228              /** @var Point $point */
 229              foreach ($this as $point) {
 230                  $sum -= $distances[$point];
 231  
 232                  if ($sum > 0) {
 233                      continue;
 234                  }
 235  
 236                  $clusters[] = new Cluster($this, $point->getCoordinates());
 237  
 238                  break;
 239              }
 240          }
 241  
 242          return $clusters;
 243      }
 244  
 245      /**
 246       * @return Cluster[]
 247       */
 248      private function initializeRandomClusters(int $clustersNumber): array
 249      {
 250          $clusters = [];
 251          [$min, $max] = $this->getBoundaries();
 252  
 253          for ($n = 0; $n < $clustersNumber; ++$n) {
 254              $clusters[] = new Cluster($this, $this->getRandomPoint($min, $max)->getCoordinates());
 255          }
 256  
 257          return $clusters;
 258      }
 259  }