Skip to content

Commit eaa2473

Browse files
authored
Polish pai submitter structure (#2859)
* polish structure * update * fix lint
1 parent 41a0db0 commit eaa2473

34 files changed

Lines changed: 1272 additions & 1083 deletions

go/codegen/pai/template_tf.go

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -113,7 +113,7 @@ const tfPredictTmplText = tfImportsText + `
113113
import os
114114
import types
115115
import traceback
116-
from runtime.pai.tensorflow import predict
116+
from runtime.pai.tensorflow_submitter import predict
117117
118118
try:
119119
import sqlflow_models
@@ -178,7 +178,7 @@ if os.environ.get('DISPLAY', '') == '':
178178
import json
179179
import types
180180
import sys
181-
from runtime.pai.tensorflow import explain
181+
from runtime.pai.tensorflow_submitter import explain
182182
183183
try:
184184
tf.enable_eager_execution()
@@ -241,7 +241,7 @@ if os.environ.get('DISPLAY', '') == '':
241241
import json
242242
import types
243243
import sys
244-
from runtime.pai.tensorflow import evaluate
244+
from runtime.pai.tensorflow_submitter import evaluate
245245
246246
try:
247247
tf.enable_eager_execution()

go/codegen/tensorflow/template_train.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,7 @@ import traceback
4242
import tensorflow as tf
4343
import runtime
4444
{{ if .IsPAI }}
45-
from runtime.pai.tensorflow.train import train
45+
from runtime.pai.tensorflow_submitter.train import train
4646
{{ else }}
4747
from runtime.tensorflow.train import train
4848
{{ end }}

python/runtime/dbapi/connection.py

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -166,13 +166,15 @@ def execute(self, statement):
166166
Returns:
167167
True on success, False otherwise
168168
"""
169+
rs = None
169170
try:
170171
rs = self._get_result_set(statement)
171172
return rs.success()
172-
except: # noqa: E722
173-
return False
173+
except Exception as e: # noqa: E722
174+
raise e
174175
finally:
175-
rs.close()
176+
if rs:
177+
rs.close()
176178

177179
def get_table_schema(self, table_name):
178180
"""Get table schema for given table

python/runtime/dbapi/maxcompute.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -116,7 +116,7 @@ def _get_result_set(self, statement):
116116
instance = self._conn.execute_sql(statement)
117117
return MaxComputeResultSet(instance)
118118
except Exception as e:
119-
return MaxComputeResultSet(None, str(e))
119+
raise e
120120

121121
def close(self):
122122
if self._conn:

python/runtime/local/submitter.py

Lines changed: 8 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -36,9 +36,14 @@ def submit_local_train(datasource, estimator_string, select, validation_select,
3636
The pre-trained model name to load
3737
train_params: dict
3838
Extra train params, will be passed to runtime.tensorflow.train
39-
or runtime.xgboost.train, required fields: original_sql,
40-
model_image, feature_column_map, label_column; optional fields:
41-
disk_cache, batch_size, epoch.
39+
or runtime.xgboost.train. Required fields:
40+
- original_sql: Original SQLFlow statement.
41+
- model_image: Docker image used for training.
42+
- feature_column_map: A map of Python feature column IR.
43+
- label_column: Feature column instance describing the label.
44+
- disk_cache (optional): Use dmatrix disk cache if True.
45+
- batch_size (optional): Split data to batches and train.
46+
- epoch (optional): Epochs to train.
4247
"""
4348
if estimator_string.lower().startswith("xgboost"):
4449
# pop required params from train_params

python/runtime/pai/__init__.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111
# See the License for the specific language governing permissions and
1212
# limitations under the License.
1313

14-
from runtime.pai.submitter import submit_pai_evaluate as evaluate # noqa: F401
15-
from runtime.pai.submitter import submit_pai_explain as explain # noqa: F401
16-
from runtime.pai.submitter import submit_pai_predict as predict # noqa: F401
17-
from runtime.pai.submitter import submit_pai_train as train # noqa: F401
14+
from runtime.pai.submitter_evaluate import submit_pai_evaluate as evaluate # noqa
15+
from runtime.pai.submitter_explain import submit_pai_explain as explain # noqa
16+
from runtime.pai.submitter_predict import submit_pai_predict as predict # noqa
17+
from runtime.pai.submitter_train import submit_pai_train as train # noqa
Lines changed: 151 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,151 @@
1+
# Copyright 2020 The SQLFlow Authors. All rights reserved.
2+
# Licensed under the Apache License, Version 2.0 (the "License");
3+
# you may not use this file except in compliance with the License.
4+
# You may obtain a copy of the License at
5+
#
6+
# http://www.apache.org/licenses/LICENSE-2.0
7+
#
8+
# Unless required by applicable law or agreed to in writing, software
9+
# distributed under the License is distributed on an "AS IS" BASIS,
10+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
11+
# See the License for the specific language governing permissions and
12+
# limitations under the License.
13+
14+
from runtime import db
15+
from runtime.diagnostics import SQLFlowDiagnostic
16+
from runtime.model import EstimatorType
17+
from runtime.pai import table_ops
18+
19+
20+
def create_predict_result_table(datasource, select, result_table, label_column,
21+
train_label_column, model_type):
22+
"""Create predict result table with given name and label column
23+
24+
Args:
25+
datasource: current datasource
26+
select: sql statement to get prediction data set
27+
result_table: the table name to save result
28+
label_column: name of the label column, if not exist in select
29+
result, we will add an int column in the result table
30+
train_label_column: name of the label column when training
31+
model_type: type of model defined in runtime.model.oss
32+
"""
33+
conn = db.connect_with_data_source(datasource)
34+
conn.execute("DROP TABLE IF EXISTS %s" % result_table)
35+
# PAI ml will create result table itself
36+
if model_type == EstimatorType.PAIML:
37+
return
38+
39+
create_table_sql = "CREATE TABLE %s AS SELECT * FROM %s LIMIT 0" % (
40+
result_table, select)
41+
conn.execute(create_table_sql)
42+
43+
# if label is not in data table, add an int column for it
44+
schema = db.get_table_schema(conn, result_table)
45+
col_type = "INT"
46+
for (name, ctype) in schema:
47+
if name == train_label_column or name == label_column:
48+
col_type = ctype
49+
break
50+
col_names = [col[0] for col in schema]
51+
if label_column not in col_names:
52+
conn.execute(
53+
conn, "ALTER TABLE %s ADD %s %s" %
54+
(result_table, label_column, col_type))
55+
if train_label_column != label_column and train_label_column in col_names:
56+
conn.execute(
57+
conn, "ALTER TABLE %s DROP COLUMN %s" %
58+
(result_table, train_label_column))
59+
60+
61+
# (TODO: lhw) This function is a common tool for prediction
62+
# on all platforms, we need to move it to a new file
63+
def create_explain_result_table(datasource, data_table, result_table,
64+
model_type, estimator, label_column):
65+
"""Create explain result table from given datasource
66+
67+
Args:
68+
datasource: current datasource
69+
data_table: input data table name
70+
result_table: table name to store the result
71+
model_type: type of the model to use
72+
estimator: estimator class if the model is TensorFlow estimator
73+
label_column: column name of the predict label
74+
"""
75+
conn = db.connect_with_data_source(datasource)
76+
drop_stmt = "DROP TABLE IF EXISTS %s" % result_table
77+
conn.execute(drop_stmt)
78+
79+
create_stmt = ""
80+
if model_type == EstimatorType.PAIML:
81+
return
82+
elif model_type == EstimatorType.TENSORFLOW:
83+
if estimator.startswith("BoostedTrees"):
84+
column_def = ""
85+
if conn.driver == "mysql":
86+
column_def = "(feature VARCHAR(255), dfc FLOAT, gain FLOAT)"
87+
else:
88+
# Hive & MaxCompute
89+
column_def = "(feature STRING, dfc STRING, gain STRING)"
90+
create_stmt = "CREATE TABLE IF NOT EXISTS %s %s;" % (result_table,
91+
column_def)
92+
else:
93+
if not label_column:
94+
raise SQLFlowDiagnostic(
95+
"need to specify WITH label_col=lable_col_name "
96+
"when explaining deep models")
97+
create_stmt = get_create_shap_result_sql(conn, data_table,
98+
result_table,
99+
label_column)
100+
elif model_type == EstimatorType.XGBOOST:
101+
if not label_column:
102+
raise SQLFlowDiagnostic(
103+
"need to specify WITH label_col=lable_col_name "
104+
"when explaining xgboost models")
105+
create_stmt = get_create_shap_result_sql(conn, data_table,
106+
result_table, label_column)
107+
else:
108+
raise SQLFlowDiagnostic(
109+
"not supported modelType %d for creating Explain result table" %
110+
model_type)
111+
112+
if not conn.execute(create_stmt):
113+
raise SQLFlowDiagnostic("Can't create explain result table")
114+
115+
116+
def get_create_shap_result_sql(conn, data_table, result_table, label_column):
117+
"""Get a sql statement which create a result table for SHAP
118+
119+
Args:
120+
conn: a database connection
121+
data_table: table name to read data from
122+
result_table: result table name
123+
label_column: column name of label
124+
125+
Returns:
126+
a sql statement to create SHAP result table
127+
"""
128+
schema = db.get_table_schema(conn, data_table)
129+
fields = ["%s STRING" % f[0] for f in schema if f[0] != label_column]
130+
return "CREATE TABLE IF NOT EXISTS %s (%s)" % (result_table,
131+
",".join(fields))
132+
133+
134+
def create_evaluate_result_table(datasource, result_table, metrics):
135+
"""Create a table to hold the evaluation result
136+
137+
Args:
138+
datasource: current datasource
139+
result_table: the table name to save result
140+
metrics: list of evaluation metrics names
141+
"""
142+
table_ops.drop_tables([result_table], datasource)
143+
# Always add loss
144+
ext_metrics = ["loss"]
145+
if isinstance(metrics, list):
146+
ext_metrics.extend(metrics)
147+
fields = ["%s STRING" % m for m in ext_metrics]
148+
sql = "CREATE TABLE IF NOT EXISTS %s (%s);" % (result_table,
149+
",".join(fields))
150+
conn = db.connect_with_data_source(datasource)
151+
conn.execute(sql)

python/runtime/pai/entry.py

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -16,18 +16,18 @@
1616

1717
from runtime.diagnostics import SQLFlowDiagnostic
1818
from runtime.pai.pai_distributed import define_tf_flags, set_oss_environs
19-
from runtime.pai.tensorflow.evaluate import evaluate as evaluate_tf
20-
from runtime.pai.tensorflow.explain import explain as explain_tf
21-
from runtime.pai.tensorflow.predict import predict as predict_tf
22-
from runtime.pai.tensorflow.train import train as train_tf
19+
from runtime.pai.tensorflow_submitter.evaluate import evaluate as evaluate_tf
20+
from runtime.pai.tensorflow_submitter.explain import explain as explain_tf
21+
from runtime.pai.tensorflow_submitter.predict import predict as predict_tf
22+
from runtime.pai.tensorflow_submitter.train import train as train_tf
2323

2424
try:
2525
# (TODO: lhw) split entry.py into multiple files,
2626
# so, we can only import needed packages
27-
from runtime.pai.xgboost.predict import predict as predict_xgb
28-
from runtime.pai.xgboost.train import train as train_xgb
29-
from runtime.pai.xgboost.explain import explain as explain_xgb
30-
from runtime.pai.xgboost.evaluate import evaluate as evaluate_xgb
27+
from runtime.pai.xgboost_submitter.predict import predict as predict_xgb
28+
from runtime.pai.xgboost_submitter.train import train as train_xgb
29+
from runtime.pai.xgboost_submitter.explain import explain as explain_xgb
30+
from runtime.pai.xgboost_submitter.evaluate import evaluate as evaluate_xgb
3131
except: # noqa: E722
3232
pass
3333

Lines changed: 111 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,111 @@
1+
# Copyright 2020 The SQLFlow Authors. All rights reserved.
2+
# Licensed under the Apache License, Version 2.0 (the "License");
3+
# you may not use this file except in compliance with the License.
4+
# You may obtain a copy of the License at
5+
#
6+
# http://www.apache.org/licenses/LICENSE-2.0
7+
#
8+
# Unless required by applicable law or agreed to in writing, software
9+
# distributed under the License is distributed on an "AS IS" BASIS,
10+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
11+
# See the License for the specific language governing permissions and
12+
# limitations under the License.
13+
14+
import json
15+
import os
16+
import string
17+
18+
from runtime.diagnostics import SQLFlowDiagnostic
19+
from runtime.pai import pai_model
20+
21+
JOB_ARCHIVE_FILE = "job.tar.gz"
22+
PARAMS_FILE = "params.txt"
23+
ENTRY_FILE = "entry.py"
24+
25+
26+
def get_pai_tf_cmd(cluster_config, tarball, params_file, entry_file,
27+
model_name, oss_model_path, train_table, val_table,
28+
res_table, project):
29+
"""Get PAI-TF cmd for training
30+
31+
Args:
32+
cluster_config: PAI cluster config
33+
tarball: the zipped resource name
34+
params_file: PAI param file name
35+
entry_file: entry file in the tarball
36+
model_name: trained model name
37+
oss_model_path: path to save the model
38+
train_table: train data table
39+
val_table: evaluate data table
40+
res_table: table to save train model, if given
41+
project: current odps project
42+
43+
Returns:
44+
The cmd to run on PAI
45+
"""
46+
job_name = "_".join(["sqlflow", model_name]).replace(".", "_")
47+
cf_quote = json.dumps(cluster_config).replace("\"", "\\\"")
48+
49+
# submit table should format as: odps://<project>/tables/<table >,
50+
# odps://<project>/tables/<table > ...
51+
submit_tables = _max_compute_table_url(train_table)
52+
if train_table != val_table and val_table:
53+
val_table = _max_compute_table_url(val_table)
54+
submit_tables = "%s,%s" % (submit_tables, val_table)
55+
output_tables = ""
56+
if res_table != "":
57+
table = _max_compute_table_url(res_table)
58+
output_tables = "-Doutputs=%s" % table
59+
60+
# NOTE(typhoonzero): use -DhyperParameters to define flags passing
61+
# OSS credentials.
62+
# TODO(typhoonzero): need to find a more secure way to pass credentials.
63+
cmd = ("pai -name tensorflow1150 -project algo_public_dev "
64+
"-DmaxHungTimeBeforeGCInSeconds=0 -DjobName=%s -Dtags=dnn "
65+
"-Dscript=%s -DentryFile=%s -Dtables=%s %s -DhyperParameters='%s'"
66+
) % (job_name, tarball, entry_file, submit_tables, output_tables,
67+
params_file)
68+
69+
# format the oss checkpoint path with ARN authorization.
70+
oss_checkpoint_configs = os.getenv("SQLFLOW_OSS_CHECKPOINT_CONFIG")
71+
if not oss_checkpoint_configs:
72+
raise SQLFlowDiagnostic(
73+
"need to configure SQLFLOW_OSS_CHECKPOINT_CONFIG when "
74+
"submitting to PAI")
75+
ckpt_conf = json.loads(oss_checkpoint_configs)
76+
model_url = pai_model.get_oss_model_url(oss_model_path)
77+
role_name = _get_project_role_name(project)
78+
# format the oss checkpoint path with ARN authorization.
79+
oss_checkpoint_path = "%s/?role_arn=%s/%s&host=%s" % (
80+
model_url, ckpt_conf["arn"], role_name, ckpt_conf["host"])
81+
cmd = "%s -DcheckpointDir='%s'" % (cmd, oss_checkpoint_path)
82+
83+
if cluster_config["worker"]["count"] > 1:
84+
cmd = "%s -Dcluster=\"%s\"" % (cmd, cf_quote)
85+
else:
86+
cmd = "%s -DgpuRequired='%d'" % (cmd, cluster_config["worker"]["gpu"])
87+
return cmd
88+
89+
90+
def _get_project_role_name(project):
91+
"""Get oss role form project name.
92+
A valid role name contains letters and numbers only.
93+
The prefix 'pai2oss' of the role name denotes PAI access to OSS.
94+
95+
Args:
96+
project: string
97+
project name
98+
99+
Returns:
100+
role name for the project
101+
"""
102+
return "pai2oss" + "".join(x for x in project.lower()
103+
if x in string.ascii_lowercase + string.digits)
104+
105+
106+
def _max_compute_table_url(table):
107+
parts = table.split(".")
108+
if len(parts) != 2:
109+
raise SQLFlowDiagnostic("odps table: %s should be format db.table" %
110+
table)
111+
return "odps://%s/tables/%s" % (parts[0], parts[1])

0 commit comments

Comments
 (0)