Lines Matching refs:dataset

56     protected $dataset;  variable in Rubix\\ML\\Tests\\Datasets\\LabeledTest
63 $this->dataset = new Labeled(self::SAMPLES, self::LABELS, false);
73 $this->assertInstanceOf(Labeled::class, $this->dataset);
74 $this->assertInstanceOf(Dataset::class, $this->dataset);
75 $this->assertInstanceOf(Countable::class, $this->dataset);
76 $this->assertInstanceOf(ArrayAccess::class, $this->dataset);
77 $this->assertInstanceOf(IteratorAggregate::class, $this->dataset);
78 $this->assertInstanceOf(Stringable::class, $this->dataset);
86 $dataset = Labeled::fromIterator(new NDJSON('tests/test.ndjson'));
88 $this->assertInstanceOf(Labeled::class, $dataset);
89 $this->assertEquals(self::SAMPLES, $dataset->samples());
90 $this->assertEquals(self::LABELS, $dataset->labels());
102 $dataset = Labeled::stack([$dataset1, $dataset2, $dataset3]);
104 $this->assertInstanceOf(Labeled::class, $dataset);
106 $this->assertEquals(3, $dataset->numRows());
107 $this->assertEquals(1, $dataset->numColumns());
115 $this->assertEquals(self::SAMPLES, $this->dataset->samples());
123 $this->assertEquals(self::SAMPLES[2], $this->dataset->sample(2));
124 $this->assertEquals(self::SAMPLES[5], $this->dataset->sample(5));
132 $this->assertEquals(6, $this->dataset->numRows());
142 $this->assertEquals($expected, $this->dataset->column(2));
150 $this->assertEquals(4, $this->dataset->numColumns());
158 $this->assertEquals(DataType::categorical(), $this->dataset->columnType(0));
159 $this->assertEquals(DataType::categorical(), $this->dataset->columnType(1));
160 $this->assertEquals(DataType::categorical(), $this->dataset->columnType(2));
161 $this->assertEquals(DataType::continuous(), $this->dataset->columnType(3));
176 $this->assertEquals($expected, $this->dataset->columnTypes());
184 $this->assertCount(2, $this->dataset->uniqueTypes());
192 $this->assertFalse($this->dataset->homogeneous());
200 $this->assertEquals([6, 4], $this->dataset->shape());
208 $this->assertEquals(24, $this->dataset->size());
218 $this->assertEquals($expected, $this->dataset->columns());
226 $dataset = $this->dataset->transformColumn(3, 'abs');
230 $this->assertEquals($expected, $dataset->column(3));
240 $columns = $this->dataset->columnsByType(DataType::categorical());
250 $this->assertFalse($this->dataset->empty());
258 $this->assertEquals(self::LABELS, $this->dataset->labels());
270 $this->dataset->transformLabels($transformer);
276 $this->assertEquals($expected, $this->dataset->labels());
284 $this->assertEquals('not monster', $this->dataset->label(0));
285 $this->assertEquals('monster', $this->dataset->label(1));
293 $this->assertEquals(DataType::categorical(), $this->dataset->labelType());
303 $this->dataset->possibleOutcomes()
312 $samples = $this->dataset->samples();
313 $labels = $this->dataset->labels();
315 $this->dataset->randomize();
317 $this->assertNotEquals($samples, $this->dataset->samples());
318 $this->assertNotEquals($labels, $this->dataset->labels());
330 $filtered = $this->dataset->filterByColumn(2, $isFriendly);
354 $filtered = $this->dataset->filterByLabel($notMonster);
374 $this->dataset->sortByColumn(1);
382 $this->assertEquals($sorted, $this->dataset->column(1));
383 $this->assertEquals($labels, $this->dataset->labels());
391 $this->dataset->sortByLabel();
398 $this->assertEquals($samples, $this->dataset->samples());
399 $this->assertEquals($labels, $this->dataset->labels());
407 $subset = $this->dataset->head(3);
418 $subset = $this->dataset->tail(3);
429 $this->assertCount(6, $this->dataset);
431 $subset = $this->dataset->take(3);
434 $this->assertCount(3, $this->dataset);
442 $this->assertCount(6, $this->dataset);
444 $subset = $this->dataset->leave(1);
447 $this->assertCount(1, $this->dataset);
455 $this->assertCount(6, $this->dataset);
457 $subset = $this->dataset->slice(2, 2);
461 $this->assertCount(6, $this->dataset);
469 $this->assertCount(6, $this->dataset);
471 $subset = $this->dataset->splice(2, 2);
475 $this->assertCount(4, $this->dataset);
483 [$left, $right] = $this->dataset->split(0.5);
494 [$left, $right] = $this->dataset->stratifiedSplit(0.5);
505 $folds = $this->dataset->fold(2);
517 $folds = $this->dataset->stratifiedFold(2);
529 $strata = $this->dataset->stratify();
540 $batches = $this->dataset->batch(2);
553 [$left, $right] = $this->dataset->splitByColumn(1, 'rough');
567 $subset = $this->dataset->randomSubset(3);
577 $subset = $this->dataset->randomSubsetWithReplacement(3);
587 $subset = $this->dataset->randomWeightedSubsetWithReplacement(3, self::WEIGHTS);
597 $this->assertCount(count(self::SAMPLES), $this->dataset);
599 $dataset = new Labeled([['nice', 'furry', 'friendly', 4.7]], ['not monster']);
601 $merged = $this->dataset->merge($dataset);
614 $this->assertEquals(count(current(self::SAMPLES)), $this->dataset->numColumns());
616 $dataset = new Unlabeled([
625 $joined = $this->dataset->join($dataset);
639 $dataset = $this->dataset->dropRow(1);
651 $this->assertInstanceOf(Labeled::class, $dataset);
652 $this->assertEquals($samples, $dataset->samples());
653 $this->assertEquals($labels, $dataset->labels());
661 $dataset = $this->dataset->dropRows([1, 5]);
672 $this->assertInstanceOf(Labeled::class, $dataset);
673 $this->assertEquals($samples, $dataset->samples());
674 $this->assertEquals($labels, $dataset->labels());
682 $dataset = $this->dataset->dropColumn(2);
698 $this->assertInstanceOf(Labeled::class, $dataset);
699 $this->assertEquals($samples, $dataset->samples());
700 $this->assertEquals($labels, $dataset->labels());
708 $dataset = $this->dataset->dropColumns([0, 2]);
724 $this->assertInstanceOf(Labeled::class, $dataset);
725 $this->assertEquals($samples, $dataset->samples());
726 $this->assertEquals($labels, $dataset->labels());
778 $results = $this->dataset->describe();
876 $results = $this->dataset->describeByLabel();
896 $results = $this->dataset->describeLabels();
907 $dataset = $this->dataset->deduplicate();
909 $this->assertCount(6, $dataset);
926 $this->assertEquals($expected, $this->dataset->toArray());
936 $encoding = $this->dataset->toJSON();
954 $encoding = $this->dataset->toNDJSON();
973 $encoding = $this->dataset->toCSV([
986 $this->assertEquals(6, $this->dataset->count());
987 $this->assertCount(6, $this->dataset);
997 $this->assertEquals($expected, $this->dataset[1]);
1014 $this->assertEquals($expected, iterator_to_array($this->dataset));