You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
161 lines
7.1 KiB
161 lines
7.1 KiB
2 years ago
|
<?php
|
||
|
// This file is part of Moodle - http://moodle.org/
|
||
|
//
|
||
|
// Moodle is free software: you can redistribute it and/or modify
|
||
|
// it under the terms of the GNU General Public License as published by
|
||
|
// the Free Software Foundation, either version 3 of the License, or
|
||
|
// (at your option) any later version.
|
||
|
//
|
||
|
// Moodle is distributed in the hope that it will be useful,
|
||
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
// GNU General Public License for more details.
|
||
|
//
|
||
|
// You should have received a copy of the GNU General Public License
|
||
|
// along with Moodle. If not, see <http://www.gnu.org/licenses/>.
|
||
|
|
||
|
/**
|
||
|
* Unit tests for the dataset manager.
|
||
|
*
|
||
|
* @package core_analytics
|
||
|
* @copyright 2017 David Monllaó {@link http://www.davidmonllao.com}
|
||
|
* @license http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
|
||
|
*/
|
||
|
|
||
|
defined('MOODLE_INTERNAL') || die();
|
||
|
|
||
|
/**
|
||
|
* Unit tests for the dataset manager.
|
||
|
*
|
||
|
* @package core_analytics
|
||
|
* @copyright 2017 David Monllaó {@link http://www.davidmonllao.com}
|
||
|
* @license http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
|
||
|
*/
|
||
|
class dataset_manager_testcase extends advanced_testcase {
|
||
|
|
||
|
/**
|
||
|
* setUp
|
||
|
*
|
||
|
* @return null
|
||
|
*/
|
||
|
public function setUp() {
|
||
|
$this->resetAfterTest(true);
|
||
|
|
||
|
$this->sharedtoprows = array(
|
||
|
array('var1', 'var2'),
|
||
|
array('value1', 'value2'),
|
||
|
array('header1', 'header2')
|
||
|
);
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* test_create_dataset
|
||
|
*
|
||
|
* @return null
|
||
|
*/
|
||
|
public function test_create_dataset() {
|
||
|
|
||
|
$dataset1 = new \core_analytics\dataset_manager(1, 1, 'whatever', \core_analytics\dataset_manager::LABELLED_FILEAREA, false);
|
||
|
$dataset1data = array_merge($this->sharedtoprows, array(array('yeah', 'yeah', 'yeah')));
|
||
|
$f1 = $dataset1->store($dataset1data);
|
||
|
|
||
|
$f1contents = $f1->get_content();
|
||
|
$this->assertContains('yeah', $f1contents);
|
||
|
$this->assertContains('var1', $f1contents);
|
||
|
$this->assertContains('value1', $f1contents);
|
||
|
$this->assertContains('header1', $f1contents);
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* test_merge_datasets
|
||
|
*
|
||
|
* @return null
|
||
|
*/
|
||
|
public function test_merge_datasets() {
|
||
|
|
||
|
$dataset1 = new \core_analytics\dataset_manager(1, 1, 'whatever', \core_analytics\dataset_manager::LABELLED_FILEAREA, false);
|
||
|
$dataset1data = array_merge($this->sharedtoprows, array(array('yeah', 'yeah', 'yeah')));
|
||
|
$f1 = $dataset1->store($dataset1data);
|
||
|
|
||
|
$dataset2 = new \core_analytics\dataset_manager(1, 2, 'whatever', \core_analytics\dataset_manager::LABELLED_FILEAREA, false);
|
||
|
$dataset2data = array_merge($this->sharedtoprows, array(array('no', 'no', 'no')));
|
||
|
$f2 = $dataset2->store($dataset2data);
|
||
|
|
||
|
$files = array($f1, $f2);
|
||
|
$merged = \core_analytics\dataset_manager::merge_datasets($files, 1, 'whatever',
|
||
|
\core_analytics\dataset_manager::LABELLED_FILEAREA);
|
||
|
|
||
|
$mergedfilecontents = $merged->get_content();
|
||
|
$this->assertContains('yeah', $mergedfilecontents);
|
||
|
$this->assertContains('no', $mergedfilecontents);
|
||
|
$this->assertContains('var1', $mergedfilecontents);
|
||
|
$this->assertContains('value1', $mergedfilecontents);
|
||
|
$this->assertContains('header1', $mergedfilecontents);
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* test_get_pending_files
|
||
|
*
|
||
|
* @return null
|
||
|
*/
|
||
|
public function test_get_pending_files() {
|
||
|
global $DB;
|
||
|
|
||
|
$this->resetAfterTest();
|
||
|
|
||
|
$fakemodelid = 123;
|
||
|
$timesplittingids = array(
|
||
|
'\core\analytics\time_splitting\quarters',
|
||
|
'\core\analytics\time_splitting\quarters_accum',
|
||
|
);
|
||
|
|
||
|
// No files.
|
||
|
$this->assertEmpty(\core_analytics\dataset_manager::get_pending_files($fakemodelid, true, $timesplittingids));
|
||
|
$this->assertEmpty(\core_analytics\dataset_manager::get_pending_files($fakemodelid, false, $timesplittingids));
|
||
|
|
||
|
// We will reuse this analysable file to create training and prediction datasets (analysable level files are
|
||
|
// merged into training and prediction files).
|
||
|
$analysabledataset = new \core_analytics\dataset_manager($fakemodelid, 1, 'whatever',
|
||
|
\core_analytics\dataset_manager::LABELLED_FILEAREA, false);
|
||
|
$analysabledatasetdata = array_merge($this->sharedtoprows, array(array('yeah', 'yeah', 'yeah')));
|
||
|
$file = $analysabledataset->store($analysabledatasetdata);
|
||
|
|
||
|
// Evaluation files ignored.
|
||
|
$evaluationdataset = \core_analytics\dataset_manager::merge_datasets(array($file), $fakemodelid,
|
||
|
'\core\analytics\time_splitting\quarters', \core_analytics\dataset_manager::LABELLED_FILEAREA, true);
|
||
|
|
||
|
$this->assertEmpty(\core_analytics\dataset_manager::get_pending_files($fakemodelid, true, $timesplittingids));
|
||
|
$this->assertEmpty(\core_analytics\dataset_manager::get_pending_files($fakemodelid, false, $timesplittingids));
|
||
|
|
||
|
// Training and prediction files are not mixed up.
|
||
|
$trainingfile1 = \core_analytics\dataset_manager::merge_datasets(array($file), $fakemodelid,
|
||
|
'\core\analytics\time_splitting\quarters', \core_analytics\dataset_manager::LABELLED_FILEAREA, false);
|
||
|
$this->waitForSecond();
|
||
|
$trainingfile2 = \core_analytics\dataset_manager::merge_datasets(array($file), $fakemodelid,
|
||
|
'\core\analytics\time_splitting\quarters', \core_analytics\dataset_manager::LABELLED_FILEAREA, false);
|
||
|
|
||
|
$bytimesplitting = \core_analytics\dataset_manager::get_pending_files($fakemodelid, true, $timesplittingids);
|
||
|
$this->assertFalse(isset($bytimesplitting['\core\analytics\time_splitting\quarters_accum']));
|
||
|
$this->assertCount(2, $bytimesplitting['\core\analytics\time_splitting\quarters']);
|
||
|
$this->assertEmpty(\core_analytics\dataset_manager::get_pending_files($fakemodelid, false, $timesplittingids));
|
||
|
|
||
|
$predictionfile = \core_analytics\dataset_manager::merge_datasets(array($file), $fakemodelid,
|
||
|
'\core\analytics\time_splitting\quarters', \core_analytics\dataset_manager::UNLABELLED_FILEAREA, false);
|
||
|
$bytimesplitting = \core_analytics\dataset_manager::get_pending_files($fakemodelid, false, $timesplittingids);
|
||
|
$this->assertFalse(isset($bytimesplitting['\core\analytics\time_splitting\quarters_accum']));
|
||
|
$this->assertCount(1, $bytimesplitting['\core\analytics\time_splitting\quarters']);
|
||
|
|
||
|
// Already used for training and prediction are discarded.
|
||
|
$usedfile = (object)['modelid' => $fakemodelid, 'fileid' => $trainingfile1->get_id(), 'action' => 'trained',
|
||
|
'time' => time()];
|
||
|
$DB->insert_record('analytics_used_files', $usedfile);
|
||
|
$bytimesplitting = \core_analytics\dataset_manager::get_pending_files($fakemodelid, true, $timesplittingids);
|
||
|
$this->assertCount(1, $bytimesplitting['\core\analytics\time_splitting\quarters']);
|
||
|
|
||
|
$usedfile->fileid = $predictionfile->get_id();
|
||
|
$usedfile->action = 'predicted';
|
||
|
$DB->insert_record('analytics_used_files', $usedfile);
|
||
|
$this->assertEmpty(\core_analytics\dataset_manager::get_pending_files($fakemodelid, false, $timesplittingids));
|
||
|
}
|
||
|
}
|