jaor · April 6, 2021 21:53
diff --git a/readme.md b/readme.md
diff --git a/metadata.json b/metadata.json
 {
  "name": "mark-missing-in-predictions",
  "kind": "script",
  "description": "Perform a batch prediction and produce an additional dataset with missings marked",
  "source_code": "script.whizzml",
  "imports":[
    ],
  "inputs":[
    {
      "name": "model",
      "type": "supervised-model-id",
      "description": "The supervised model to use for predictions"
    },
    {
      "name": "dataset",
      "type": "dataset-id",
      "description": "The input dataset"
    },
    {
      "name": "denied-class",
      "type": "string",
      "description": "Class used to denote denied predictions",
      "default": "denied"
    },
    {
      "name": "fields",
      "description": "List of fields to check for missing values, or empty to check all fields",
      "type": "list",
      "default": []
    }],
  "outputs":[
    {
      "name": "batch-prediction",
      "type": "batchprediction-id",
      "description": "The full batch prediction"
    },
    {
      "name": "corrected-predictions",
      "description": "The dataset with all predictions, some marked as denied",
      "type": "dataset-id"
    },
    {
      "name": "filtered-predictions",
      "description": "The dataset with only the predictions not marked as denied",
      "type": "dataset-id"
    }]
 }
diff --git a/script.whizzml b/script.whizzml

 ;; Create a batch prediction of `model` over `dataset` with the
 ;; "output_dataset" and "all_fields" options enabled, and wait for the
 ;; resulting resource to finish.
 (define batch-prediction
   (let (options {"output_dataset" true
                  "all_fields" true}
         request (create-batchprediction model dataset options))
     (wait request)))

 ;; Dataset built from the batch prediction's output dataset, extended
 ;; with a "corrected-prediction" field. The field's flatline expression
 ;; yields `denied-class` when at least one of the checked fields is
 ;; missing, and otherwise the string form of the field named by the
 ;; model's "objective_field_name" property (presumably the prediction
 ;; column of the output dataset -- confirm against the batch prediction
 ;; settings).
 (define corrected-predictions
   (let (bp (fetch batch-prediction)
         output-ds (wait (bp "output_dataset_resource"))
         ;; `fds` and `obj` are interpolated by name in the flatline
         ;; template below, so these two bindings must keep their names.
         ;; An empty `fields` input means: check every field of the
         ;; output dataset.
         fds (if (not (empty? fields))
               fields
               (keys (resource-fields output-ds)))
         obj (resource-property model "objective_field_name")
         marker (flatline "(if (> (count (filter (missing? _) (list @{{fds}}))) 0)"
                          "  {{denied-class}} (str (f {{obj}})))")
         new-field {"field" marker
                    "name" "corrected-prediction"})
     (wait (create-dataset output-ds {"new_fields" [new-field]}))))

 ;; Dataset derived from `corrected-predictions`, filtered by a flatline
 ;; expression that compares "corrected-prediction" against
 ;; `denied-class` with `!=`; the "corrected-prediction" field itself is
 ;; listed in "excluded_fields".
 (define filtered-predictions
   (let (keep-row (flatline "(!= {{denied-class}} (f \"corrected-prediction\"))")
         options {"lisp_filter" keep-row
                  "excluded_fields" ["corrected-prediction"]})
     (wait (create-dataset corrected-predictions options))))
	{
	"name": "mark-missing-in-predictions",
	"kind": "script",
	"description": "Perform a batch prediction and produce an additional dataset with missings marked",
	"source_code": "script.whizzml",
	"imports":[
	],
	"inputs":[
	{
	"name": "model",
	"type": "supervised-model-id",
	"description": "The supervised model to use for predictions"
	},
	{
	"name": "dataset",
	"type": "dataset-id",
	"description": "The input dataset"
	},
	{
	"name": "denied-class",
	"type": "string",
	"description": "Class used to denote denied predictions",
	"default": "denied"
	},
	{
	"name": "fields",
	"description": "List of fields to check for missing values, or empty to check all fields",
	"type": "list",
	"default": []
	}],
	"outputs":[
	{
	"name": "batch-prediction",
	"type": "batchprediction-id",
	"description": "The full batch prediction"
	},
	{
	"name": "corrected-predictions",
	"description": "The dataset with all predictions, some marked as denied",
	"type": "dataset-id"
	},
	{
	"name": "filtered-predictions",
	"description": "The dataset with only the predictions not marked as denied",
	"type": "dataset-id"
	}]
	}

	;; Create a batch prediction of `model` over `dataset` with the
	;; "output_dataset" and "all_fields" options enabled, and wait for the
	;; resulting resource to finish.
	(define batch-prediction
	  (let (options {"output_dataset" true
	                 "all_fields" true}
	        request (create-batchprediction model dataset options))
	    (wait request)))

	;; Dataset built from the batch prediction's output dataset, extended
	;; with a "corrected-prediction" field. The field's flatline expression
	;; yields `denied-class` when at least one of the checked fields is
	;; missing, and otherwise the string form of the field named by the
	;; model's "objective_field_name" property (presumably the prediction
	;; column of the output dataset -- confirm against the batch prediction
	;; settings).
	(define corrected-predictions
	  (let (bp (fetch batch-prediction)
	        output-ds (wait (bp "output_dataset_resource"))
	        ;; `fds` and `obj` are interpolated by name in the flatline
	        ;; template below, so these two bindings must keep their names.
	        ;; An empty `fields` input means: check every field of the
	        ;; output dataset.
	        fds (if (not (empty? fields))
	              fields
	              (keys (resource-fields output-ds)))
	        obj (resource-property model "objective_field_name")
	        marker (flatline "(if (> (count (filter (missing? _) (list @{{fds}}))) 0)"
	                         " {{denied-class}} (str (f {{obj}})))")
	        new-field {"field" marker
	                   "name" "corrected-prediction"})
	    (wait (create-dataset output-ds {"new_fields" [new-field]}))))

	;; Dataset derived from `corrected-predictions`, filtered by a flatline
	;; expression that compares "corrected-prediction" against
	;; `denied-class` with `!=`; the "corrected-prediction" field itself is
	;; listed in "excluded_fields".
	(define filtered-predictions
	  (let (keep-row (flatline "(!= {{denied-class}} (f \"corrected-prediction\"))")
	        options {"lisp_filter" keep-row
	                 "excluded_fields" ["corrected-prediction"]})
	    (wait (create-dataset corrected-predictions options))))