Search moodle.org's
Developer Documentation

See Release Notes

  • Bug fixes for general core bugs in 3.11.x will end 14 Nov 2022 (12 months plus 6 months extension).
  • Bug fixes for security issues in 3.11.x will end 13 Nov 2023 (18 months plus 12 months extension).
  • PHP version: minimum PHP 7.3.0. Note: the minimum PHP version has increased since Moodle 3.10. PHP 7.4.x is also supported.
<?php
// This file is part of Moodle - http://moodle.org/
//
// Moodle is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// Moodle is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with Moodle.  If not, see <http://www.gnu.org/licenses/>.

/**
 * Python predictions processor
 *
 * @package   mlbackend_python
 * @copyright 2016 David Monllao {@link http://www.davidmonllao.com}
 * @license   http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
 */

namespace mlbackend_python;

defined('MOODLE_INTERNAL') || die();

/**
 * Python predictions processor.
 *
 * @package   mlbackend_python
 * @copyright 2016 David Monllao {@link http://www.davidmonllao.com}
 * @license   http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
 */
class processor implements  \core_analytics\classifier, \core_analytics\regressor, \core_analytics\packable {

    /**
     * The required version of the python package that performs all calculations.
     */
    const REQUIRED_PIP_PACKAGE_VERSION = '2.6.6';

    /**
     * The python package is installed in a server.
     * @var bool
     */
    protected $useserver;

    /**
     * The path to the Python bin.
     *
     * @var string
     */
    protected $pathtopython;

    /**
     * Remote server host
     * @var string
     */
    protected $host;

    /**
     * Remote server port
     * @var int
     */
    protected $port;

    /**
     * Whether to use http or https.
     * @var bool
     */
    protected $secure;

    /**
     * Server username.
     * @var string
     */
    protected $username;

    /**
     * Server password for $this->username.
     * @var string
     */
    protected $password;

    /**
     * Loads the plugin settings and stores the ones that apply to the selected mode.
     *
     * When the 'useserver' setting is enabled the connection details (host, port, secure,
     * username and password) are read from the plugin config; otherwise only the path to the
     * local python binary is read from $CFG.
     */
    public function __construct() {
        global $CFG;

        $settings = get_config('mlbackend_python');
        $this->useserver = !empty($settings->useserver);

        if ($this->useserver) {
            // Remote python ML server: keep the connection details, defaulting the missing ones.
            $this->host = $settings->host ?? '';
            $this->port = $settings->port ?? '';
            $this->secure = $settings->secure ?? false;
            $this->username = $settings->username ?? '';
            $this->password = $settings->password ?? '';
            return;
        }

        // Local python package: the path is only stored when it has a value.
        if (!empty($CFG->pathtopython)) {
            $this->pathtopython = $CFG->pathtopython;
        }
    }

    /**
     * Reports whether the backend can be used in the configured mode.
     *
     * Delegates to the python server check when a server is configured and to the
     * local web server check otherwise.
     *
     * @return bool|string Returns true on success, a string detailing the error otherwise
     */
    public function is_ready() {
        return $this->useserver ? $this->is_python_server_ready() : $this->is_webserver_ready();
    }

    /**
     * Checks that the python package can be run by the web server executing this script.
     *
     * Runs the moodlemlbackend.version module with the configured python binary and
     * validates the version it prints.
     *
     * @return bool|string Returns true on success, a string detailing the error otherwise
     */
    protected function is_webserver_ready() {
        if (empty($this->pathtopython)) {
            // Point the admin to the page where the python path is set.
            $systempathsurl = new \moodle_url('/admin/settings.php', ['section' => 'systempaths']);
            return get_string('pythonpathnotdefined', 'mlbackend_python', $systempathsurl->out());
        }

        // Command that prints the installed pip package version.
        $versioncmd = $this->pathtopython . ' -m moodlemlbackend.version';

        // Standard error is redirected to standard output so it is captured as well.
        $outputlines = null;
        $status = null;
        $installedversion = exec($versioncmd . ' 2>&1', $outputlines, $status);

        if ($status != 0) {
            return get_string('pythonpackagenotinstalled', 'mlbackend_python', $versioncmd);
        }

        $comparison = self::check_pip_package_version($installedversion);
        return $this->version_check_return($installedversion, $comparison);
    }

    /**
     * Checks that the python ML server is configured, reachable and runs a valid package version.
     *
     * @return bool|string True or an error string.
     */
    protected function is_python_server_ready() {
        $missingsetting = empty($this->host) || empty($this->port)
            || empty($this->username) || empty($this->password);
        if ($missingsetting) {
            return get_string('errornoconfigdata', 'mlbackend_python');
        }

        // The 'ignoresecurity' option lets the request reach 'localhost' and other hosts/ports
        // that could otherwise be blocked.
        $client = new \curl(['ignoresecurity' => true]);
        $versionurl = $this->get_server_url('version')->out(false);
        $reportedversion = $client->get($versionurl);

        $httpstatus = $client->info['http_code'];
        if ($httpstatus !== 200) {
            $details = $this->server_error_str($httpstatus, $reportedversion);
            return get_string('errorserver', 'mlbackend_python', $details);
        }

        // The response body is used as the version of the package installed in the server.
        $comparison = self::check_pip_package_version($reportedversion);
        return $this->version_check_return($reportedversion, $comparison);
    }

    /**
     * Removes the data stored for a model version.
     *
     * In server mode a 'deletemodel' request is posted for $uniqueid; otherwise the
     * local $modelversionoutputdir directory is removed.
     *
     * @throws \moodle_exception
     * @param string $uniqueid
     * @param string $modelversionoutputdir
     * @return void
     */
    public function clear_model($uniqueid, $modelversionoutputdir) {
        if ($this->useserver) {
            // The server owns the model files, so it is asked to delete them.
            $this->server_request($this->get_server_url('deletemodel'), 'post', ['uniqueid' => $uniqueid]);
            return;
        }

        remove_dir($modelversionoutputdir);
    }

    /**
     * Removes all the data stored for a model.
     *
     * In server mode a 'deletemodel' request is posted for $uniqueid; otherwise the
     * local $modeloutputdir directory is removed.
     *
     * @throws \moodle_exception
     * @param string $modeloutputdir
     * @param string $uniqueid
     * @return void
     */
    public function delete_output_dir($modeloutputdir, $uniqueid) {
        if ($this->useserver) {
            // The server owns the model files, so it is asked to delete them.
            $this->server_request($this->get_server_url('deletemodel'), 'post', ['uniqueid' => $uniqueid]);
            return;
        }

        remove_dir($modeloutputdir);
    }

    /**
     * Trains the classification model with the provided dataset.
     *
     * The training runs either through the local 'training' python module or through the
     * 'training' endpoint of the python ML server. The JSON returned by the backend is decoded
     * and, when its status is not 0, its errors are formatted into the info field.
     *
     * @throws \moodle_exception If the backend output can not be decoded.
     * @param string $uniqueid
     * @param \stored_file $dataset
     * @param string $outputdir
     * @return \stdClass
     */
    public function train_classification($uniqueid, \stored_file $dataset, $outputdir) {

        if ($this->useserver) {
            // Remote training: the output directory is identified by its hash.
            $payload = [
                'uniqueid' => $uniqueid,
                'dirhash' => $this->hash_dir($outputdir),
                'dataset' => $dataset,
            ];
            list($rawresult) = $this->server_request($this->get_server_url('training'), 'post', $payload);
        } else {
            // Local training: the dataset is copied to the local file system first.
            $arguments = [$uniqueid, $outputdir, $this->get_file_path($dataset)];
            list($rawresult) = $this->exec_command('training', $arguments, 'errornopredictresults');
        }

        $decoded = json_decode($rawresult);
        if (!$decoded) {
            throw new \moodle_exception('errorpredictwrongformat', 'analytics', '', json_last_error_msg());
        }

        // A status other than 0 means the backend reported a problem.
        return ($decoded->status != 0) ? $this->format_error_info($decoded) : $decoded;
    }

    /**
     * Classifies the provided dataset samples.
     *
     * The prediction runs either through the local 'prediction' python module or through the
     * 'prediction' endpoint of the python ML server.
     *
     * @throws \moodle_exception If the backend output can not be decoded.
     * @param string $uniqueid
     * @param \stored_file $dataset
     * @param string $outputdir
     * @return \stdClass
     */
    public function classify($uniqueid, \stored_file $dataset, $outputdir) {

        if (!$this->useserver) {
            // Use the local file system.

            list($result, $exitcode) = $this->exec_command('prediction', [$uniqueid, $outputdir,
                $this->get_file_path($dataset)], 'errornopredictresults');

        } else {
            // Use the server.

            $requestparams = ['uniqueid' => $uniqueid, 'dirhash' => $this->hash_dir($outputdir),
                'dataset' => $dataset];

            $url = $this->get_server_url('prediction');
            list($result, $httpcode) = $this->server_request($url, 'post', $requestparams);
        }

        if (!$resultobj = json_decode($result)) {
            throw new \moodle_exception('errorpredictwrongformat', 'analytics', '', json_last_error_msg());
        }

        if ($resultobj->status != 0) {
            $resultobj = $this->format_error_info($resultobj);
        }

        return $resultobj;
    }

    /**
     * Evaluates this processor classification model using the provided supervised learning dataset.
     *
     * In server mode a second request downloads the evaluation log zip, which is extracted into
     * $outputdir/logs/<runid>; that directory is then stored in the 'dir' field of the result.
     *
     * @throws \moodle_exception
     * @param string $uniqueid
     * @param float $maxdeviation
     * @param int $niterations
     * @param \stored_file $dataset
     * @param string $outputdir
     * @param string $trainedmodeldir
     * @return \stdClass
     */
    public function evaluate_classification($uniqueid, $maxdeviation, $niterations, \stored_file $dataset,
            $outputdir, $trainedmodeldir) {
        global $CFG;

        if (!$this->useserver) {
            // Use the local file system.

            $datasetpath = $this->get_file_path($dataset);

            $params = [$uniqueid, $outputdir, $datasetpath, \core_analytics\model::MIN_SCORE,
                $maxdeviation, $niterations];

            // The trained model directory is an optional trailing argument.
            if ($trainedmodeldir) {
                $params[] = $trainedmodeldir;
            }

            list($result, $exitcode) = $this->exec_command('evaluation', $params, 'errornopredictresults');
            if (!$resultobj = json_decode($result)) {
                throw new \moodle_exception('errorpredictwrongformat', 'analytics', '', json_last_error_msg());
            }

        } else {
            // Use the server.

            $requestparams = ['uniqueid' => $uniqueid, 'minscore' => \core_analytics\model::MIN_SCORE,
                'maxdeviation' => $maxdeviation, 'niterations' => $niterations,
                'dirhash' => $this->hash_dir($outputdir), 'dataset' => $dataset];

            if ($trainedmodeldir) {
                $requestparams['trainedmodeldirhash'] = $this->hash_dir($trainedmodeldir);
            }

            $url = $this->get_server_url('evaluation');
            list($result, $httpcode) = $this->server_request($url, 'post', $requestparams);

            if (!$resultobj = json_decode($result)) {
                throw new \moodle_exception('errorpredictwrongformat', 'analytics', '', json_last_error_msg());
            }

            // We need an extra request to get the resources generated during the evaluation process.

            // Directory to temporarily store the evaluation log zip returned by the server.
            $evaluationtmpdir = make_request_directory();
            $evaluationzippath = $evaluationtmpdir . DIRECTORY_SEPARATOR . 'evaluationlog.zip';

            $requestparams = ['uniqueid' => $uniqueid, 'dirhash' => $this->hash_dir($outputdir),
                'runid' => $resultobj->runid];

            $url = $this->get_server_url('evaluationlog');
            list($result, $httpcode) = $this->server_request($url, 'download_one', $requestparams,
                ['filepath' => $evaluationzippath]);

            $rundir = $outputdir . DIRECTORY_SEPARATOR . 'logs' . DIRECTORY_SEPARATOR . $resultobj->runid;
            if (!mkdir($rundir, $CFG->directorypermissions, true)) {
                throw new \moodle_exception('errorexportmodelresult', 'analytics');
            }

            $zip = new \zip_packer();
            $success = $zip->extract_to_pathname($evaluationzippath, $rundir, null, null, true);
            if (!$success) {
                $a = 'The evaluation files can not be exported to ' . $rundir;
                throw new \moodle_exception('errorpredictionsprocessor', 'analytics', '', $a);
            }

            $resultobj->dir = $rundir;
        }

        $resultobj = $this->add_extra_result_info($resultobj);

        return $resultobj;
    }

    /**
     * Exports the machine learning model.
     *
     * @throws \moodle_exception
     * @param  string $uniqueid  The model unique id
     * @param  string $modeldir  The directory that contains the trained model.
     * @return string            The path to the directory that contains the exported model.
     */
    public function export(string $uniqueid, string $modeldir) : string {

        $exporttmpdir = make_request_directory();

        if (!$this->useserver) {
            // Use the local file system.

            // We include an exporttmpdir as we want to be sure that the file is not deleted after the
            // python process finishes.
            list($exportdir, $exitcode) = $this->exec_command('export', [$uniqueid, $modeldir, $exporttmpdir],
                'errorexportmodelresult');

            if ($exitcode != 0) {
                throw new \moodle_exception('errorexportmodelresult', 'analytics');
            }

        } else {
            // Use the server.

            $requestparams = ['uniqueid' => $uniqueid, 'dirhash' => $this->hash_dir($modeldir)];

            $exportzippath = $exporttmpdir . DIRECTORY_SEPARATOR . 'export.zip';

            $url = $this->get_server_url('export');
            list($result, $httpcode) = $this->server_request($url, 'download_one', $requestparams,
                ['filepath' => $exportzippath]);

            // The downloaded zip is extracted into a separate request directory.
            $exportdir = make_request_directory();
            $zip = new \zip_packer();
            $success = $zip->extract_to_pathname($exportzippath, $exportdir, null, null, true);
            if (!$success) {
                throw new \moodle_exception('errorexportmodelresult', 'analytics');
            }
        }

        return $exportdir;
    }

    /**
     * Imports the provided machine learning model.
     *
     * @throws \moodle_exception
     * @param  string $uniqueid The model unique id
     * @param  string $modeldir  The directory that will contain the trained model.
     * @param  string $importdir The directory that contains the files to import.
     * @return bool Success
     */
    public function import(string $uniqueid, string $modeldir, string $importdir) : bool {

        if (!$this->useserver) {
            // Use the local file system.

            list($result, $exitcode) = $this->exec_command('import', [$uniqueid, $modeldir, $importdir],
                'errorimportmodelresult');

            if ($exitcode != 0) {
                throw new \moodle_exception('errorimportmodelresult', 'analytics');
            }

        } else {
            // Use the server.

            // Zip the $importdir to send a single file.
            $importzipfile = $this->zip_dir($importdir);
            if (!$importzipfile) {
                // There was an error zipping the directory.
                throw new \moodle_exception('errorimportmodelresult', 'analytics');
            }

            $requestparams = ['uniqueid' => $uniqueid, 'dirhash' => $this->hash_dir($modeldir),
                'importzip' => curl_file_create($importzipfile, null, 'import.zip')];

            $url = $this->get_server_url('import');
            list($result, $httpcode) = $this->server_request($url, 'post', $requestparams);
        }

        return (bool)$result;
    }

    /**
     * Train this processor regression model using the provided supervised learning dataset.
     *
     * @throws \coding_exception Always, regression is not supported.
     * @param string $uniqueid
     * @param \stored_file $dataset
     * @param string $outputdir
     * @return \stdClass
     */
    public function train_regression($uniqueid, \stored_file $dataset, $outputdir) {
        throw new \coding_exception('This predictor does not support regression yet.');
    }

    /**
     * Estimates linear values for the provided dataset samples.
     *
     * @throws \coding_exception Always, regression is not supported.
     * @param string $uniqueid
     * @param \stored_file $dataset
     * @param mixed $outputdir
     * @return void
     */
    public function estimate($uniqueid, \stored_file $dataset, $outputdir) {
        throw new \coding_exception('This predictor does not support regression yet.');
    }

    /**
     * Evaluates this processor regression model using the provided supervised learning dataset.
     *
     * @throws \coding_exception Always, regression is not supported.
     * @param string $uniqueid
     * @param float $maxdeviation
     * @param int $niterations
     * @param \stored_file $dataset
     * @param string $outputdir
     * @param string $trainedmodeldir
     * @return \stdClass
     */
    public function evaluate_regression($uniqueid, $maxdeviation, $niterations, \stored_file $dataset,
            $outputdir, $trainedmodeldir) {
        throw new \coding_exception('This predictor does not support regression yet.');
    }

    /**
     * Returns the path to the dataset file.
     *
     * @param \stored_file $file
     * @return string
     */
    protected function get_file_path(\stored_file $file) {
        // From moodle filesystem to the local file system.
        // This is not ideal, but there is no read access to moodle filesystem files.
        return $file->copy_content_to_temp('core_analytics');
    }

    /**
     * Check that the given package version can be used and return the error status.
     *
     * When evaluating the version, we assume the semantic versioning scheme as described at
     * https://semver.org/.
     *
     * @param string $actual The actual Python package version
     * @param string $required The required version of the package
     * @return int -1 = actual version is too low, 1 = actual version too high, 0 = actual version is ok
     */
    public static function check_pip_package_version($actual, $required = self::REQUIRED_PIP_PACKAGE_VERSION) {

        if (empty($actual)) {
            return -1;
        }

        if (version_compare($actual, $required, '<')) {
            return -1;
        }

        // The first component of each version is compared as the API version.
        $parts = explode('.', $required);
        $requiredapiver = reset($parts);

        $parts = explode('.', $actual);
        $actualapiver = reset($parts);

        if ($requiredapiver > 0 || $actualapiver > 1) {
            // Anything at or above the next API version is reported as too high.
            if (version_compare($actual, $requiredapiver + 1, '>=')) {
                return 1;
            }
        }

        return 0;
    }

    /**
     * Executes the specified module.
     *
     * @throws \moodle_exception If the command prints no result.
     * @param  string $modulename
     * @param  array  $params
     * @param  string $errorlangstr
     * @return array [0] is the result body and [1] the exit code.
     */
    protected function exec_command(string $modulename, array $params, string $errorlangstr) {

        $cmd = $this->pathtopython . ' -m moodlemlbackend.' . $modulename . ' ';
        foreach ($params as $param) {
            $cmd .= escapeshellarg($param) . ' ';
        }

        if (!PHPUNIT_TEST && CLI_SCRIPT) {
            debugging($cmd, DEBUG_DEVELOPER);
        }

        $output = null;
        $exitcode = null;
        $result = exec($cmd, $output, $exitcode);

        if (!$result) {
            throw new \moodle_exception($errorlangstr, 'analytics');
        }

        return [$result, $exitcode];
    }

    /**
     * Formats the errors and info in a single info string.
     *
     * @param  \stdClass $resultobj
     * @return \stdClass
     */
    private function format_error_info(\stdClass $resultobj) {

        // Start from an empty message so the variable is always defined, even when the
        // result carries neither errors nor info.
        $errors = '';

        if (!empty($resultobj->errors)) {
            $errors = $resultobj->errors;
            if (is_array($errors)) {
                $errors = implode(', ', $errors);
            }
        } else if (!empty($resultobj->info)) {
            // Show info if no errors are returned.
            $errors = $resultobj->info;
            if (is_array($errors)) {
                $errors = implode(', ', $errors);
            }
        }
        $resultobj->info = array(get_string('errorpredictionsprocessor', 'analytics', $errors));

        return $resultobj;
    }

    /**
     * Returns the url to the python ML server.
     *
     * @param  string|null $path
     * @return \moodle_url
     */
    private function get_server_url(?string $path = null) {
        $protocol = !empty($this->secure) ? 'https' : 'http';
        $url = $protocol . '://' . rtrim($this->host, '/');
        if (!empty($this->port)) {
            $url .= ':' . $this->port;
        }

        if ($path) {
            $url .= '/' . $path;
        }

        return new \moodle_url($url);
    }

    /**
     * Sends a request to the python ML server.
     *
     * @throws \coding_exception If $method is not one of 'get', 'post' or 'download_one'.
     * @throws \moodle_exception If the server does not answer with a 200 HTTP code.
     * @param  \moodle_url      $url            The requested url in the python ML server
     * @param  string           $method         The curl method to use
     * @param  array            $requestparams  Curl request params
     * @param  array|null       $options        Curl request options
     * @return array                            [0] for the response body and [1] for the http code
     */
    protected function server_request($url, string $method, array $requestparams, ?array $options = null) {

        if ($method !== 'post' && $method !== 'get' && $method !== 'download_one') {
            throw new \coding_exception('Incorrect request method provided. Only "get", "post" and "download_one"' .
                ' actions are available.');
        }

        // Connection is allowed to use 'localhost' and other potentially blocked hosts/ports.
        $curl = new \curl(['ignoresecurity' => true]);

        $authorization = $this->username . ':' . $this->password;
        $curl->setHeader('Authorization: Basic ' . base64_encode($authorization));

        // The method name is also the name of the curl method that gets called.
        $responsebody = $curl->{$method}($url, $requestparams, $options);

        if ($curl->info['http_code'] !== 200) {
            throw new \moodle_exception('errorserver', 'mlbackend_python', '',
                $this->server_error_str($curl->info['http_code'], $responsebody));
        }

        return [$responsebody, $curl->info['http_code']];
    }

    /**
     * Adds extra information to results info.
     *
     * @param  \stdClass $resultobj
     * @return \stdClass
     */
    protected function add_extra_result_info(\stdClass $resultobj): \stdClass {

        if (!empty($resultobj->dir)) {
            $dir = $resultobj->dir . DIRECTORY_SEPARATOR . 'tensor';
            $resultobj->info[] = get_string('tensorboardinfo', 'mlbackend_python', $dir);
        }
        return $resultobj;
    }

    /**
     * Returns the proper return value for the version checking.
     *
     * @param  string $actual   Actual moodlemlbackend version
     * @param  int    $vercheck Version checking result
     * @return true|string      Returns true on success, a string detailing the error otherwise
     */
    private function version_check_return($actual, $vercheck) {

        if ($vercheck === 0) {
            return true;
        }

        if ($actual) {
            $a = [
                'installed' => $actual,
                'required' => self::REQUIRED_PIP_PACKAGE_VERSION,
            ];

            if ($vercheck < 0) {
                return get_string('packageinstalledshouldbe', 'mlbackend_python', $a);

            } else if ($vercheck > 0) {
                return get_string('packageinstalledtoohigh', 'mlbackend_python', $a);
            }
        }

        if (!$this->useserver) {
            $cmd = "{$this->pathtopython} -m moodlemlbackend.version";
        } else {
            // We cannot know which is the python bin in the python ML server, the most likely
            // value is 'python'.
            $cmd = "python -m moodlemlbackend.version";
        }
        return get_string('pythonpackagenotinstalled', 'mlbackend_python', $cmd);
    }

    /**
     * Hashes the provided dir as a string.
     *
     * @param  string $dir Directory path
     * @return string Hash
     */
    private function hash_dir(string $dir) {
        return md5($dir);
    }

    /**
     * Zips the provided directory.
     *
     * @param  string $dir Directory path
     * @return string|false The zip filename, false if the directory could not be zipped
     */
    private function zip_dir(string $dir) {

        $ziptmpdir = make_request_directory();
        $ziptmpfile = $ziptmpdir . DIRECTORY_SEPARATOR . 'mlbackend.zip';

        $files = get_directory_list($dir);
        $zipfiles = [];
        foreach ($files as $file) {
            $fullpath = $dir . DIRECTORY_SEPARATOR . $file;
            // Use the relative path to the file as the path in the zip.
            $zipfiles[$file] = $fullpath;
        }

        $zip = new \zip_packer();
        if (!$zip->archive_to_pathname($zipfiles, $ziptmpfile)) {
            return false;
        }

        return $ziptmpfile;
    }

    /**
     * Error string for httpcode !== 200
     *
     * @param int       $httpstatuscode The HTTP status code
     * @param string    $responsebody   The body of the response
     * @return string
     */
    private function server_error_str(int $httpstatuscode, string $responsebody): string {
        return 'HTTP status code ' . $httpstatuscode . ': ' . $responsebody;
    }
}