-
-
Notifications
You must be signed in to change notification settings - Fork 189
/
Copy pathTfIdfTransformerTest.php
83 lines (67 loc) · 2.72 KB
/
TfIdfTransformerTest.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
<?php
namespace Rubix\ML\Tests\Transformers;
use Rubix\ML\Persistable;
use Rubix\ML\Datasets\Unlabeled;
use Rubix\ML\Transformers\Elastic;
use Rubix\ML\Transformers\Stateful;
use Rubix\ML\Transformers\Reversible;
use Rubix\ML\Transformers\Transformer;
use Rubix\ML\Transformers\TfIdfTransformer;
use PHPUnit\Framework\TestCase;
/**
* @group Transformers
* @covers \Rubix\ML\Transformers\TfIdfTransformer
*/
class TfIdfTransformerTest extends TestCase
{
    /**
     * Absolute tolerance used when comparing floating-point sample values.
     *
     * The expected weights are products of logarithms and the reverse pass
     * divides them back out, so results may differ from the literals below in
     * the last bits depending on platform and arithmetic order.
     *
     * @var float
     */
    private const TOLERANCE = 1e-8;

    /**
     * The transformer instance under test, rebuilt before every test method.
     *
     * @var TfIdfTransformer
     */
    protected $transformer;

    /**
     * Create a fresh transformer so that no fitted state leaks between tests.
     *
     * NOTE(review): the meaning of the two constructor arguments (1.0, false)
     * is defined by TfIdfTransformer and is not visible here - confirm against
     * the class before changing them, since the expected values below depend
     * on them.
     *
     * @before
     */
    protected function setUp() : void
    {
        $this->transformer = new TfIdfTransformer(1.0, false);
    }

    /**
     * The transformer must implement every interface the library relies on.
     *
     * @test
     */
    public function build() : void
    {
        $this->assertInstanceOf(TfIdfTransformer::class, $this->transformer);
        $this->assertInstanceOf(Transformer::class, $this->transformer);
        $this->assertInstanceOf(Stateful::class, $this->transformer);
        $this->assertInstanceOf(Elastic::class, $this->transformer);
        $this->assertInstanceOf(Reversible::class, $this->transformer);
        $this->assertInstanceOf(Persistable::class, $this->transformer);
    }

    /**
     * Fit on a small count matrix, check the fitted state, apply the
     * transformation, and verify that reversing it restores the input.
     *
     * @test
     */
    public function fitTransformReverse() : void
    {
        // 3 samples x 19 columns of non-negative integer counts.
        $dataset = new Unlabeled([
            [1, 3, 0, 0, 1, 0, 0, 0, 1, 2, 0, 2, 0, 0, 0, 4, 1, 0, 1],
            [0, 1, 1, 0, 0, 2, 1, 0, 0, 0, 0, 3, 0, 1, 0, 0, 0, 0, 0],
            [0, 0, 0, 1, 2, 3, 0, 0, 4, 2, 0, 0, 1, 0, 2, 0, 1, 0, 0],
        ]);

        $this->transformer->fit($dataset);

        $this->assertTrue($this->transformer->fitted());

        // One integer entry is expected per input column.
        $dfs = $this->transformer->dfs();

        $this->assertIsArray($dfs);
        $this->assertCount(19, $dfs);
        $this->assertContainsOnly('int', $dfs);

        // Keep an untouched copy to compare against after the round trip.
        $original = clone $dataset;

        $dataset->apply($this->transformer);

        $expected = [
            [1.6931471805599454, 3.8630462173553424, 0.0, 0.0, 1.2876820724517808, 0.0, 0.0, 0.0, 1.2876820724517808, 2.5753641449035616, 0.0, 2.5753641449035616, 0.0, 0.0, 0.0, 6.772588722239782, 1.2876820724517808, 0.0, 1.6931471805599454],
            [0.0, 1.2876820724517808, 1.6931471805599454, 0.0, 0.0, 2.5753641449035616, 1.6931471805599454, 0.0, 0.0, 0.0, 0.0, 3.8630462173553424, 0.0, 1.6931471805599454, 0.0, 0.0, 0.0, 0.0, 0.0],
            [0.0, 0.0, 0.0, 1.6931471805599454, 2.5753641449035616, 3.8630462173553424, 0.0, 0.0, 5.150728289807123, 2.5753641449035616, 0.0, 0.0, 1.6931471805599454, 0.0, 3.386294361119891, 0.0, 1.2876820724517808, 0.0, 0.0],
        ];

        // Compare with a tolerance: exact equality on computed floats is
        // brittle and can fail on a one-ULP difference.
        $this->assertEqualsWithDelta($expected, $dataset->samples(), self::TOLERANCE);

        $dataset->reverseApply($this->transformer);

        // The reversed values are floats produced by a multiply/divide round
        // trip, so they are matched against the integer counts within the
        // same tolerance.
        $this->assertEqualsWithDelta($original->samples(), $dataset->samples(), self::TOLERANCE);
    }
}