Name: Demo-data-exploration
Version: 26
Creator: Florian_Dietz
This Rule starts a major series of tasks, each dependent on the one before it.
The purpose of this Rule is the initial exploration of the content of a table.
1. Acquire a file from the user through task_obtain_file_from_user.
2. Transform the file into a pickled Pandas DataFrame using task_convert_file_type.
3. Cleanse and analyze the file through task_data_cleansing_and_analysis_for_pandas.
4. Present the results through task_present_table_for_pandas.
5. Perform additional, more complex analyses through task_explore_data_for_pandas.
ID: 353
Created: April 9, 2019, 5:11 p.m.
The below is the JSON description of this object.
It is annotated with links to the documentation of each component.
You can hide fields with default values to make things clearer, and copy it to the clipboard to make creating similar Rules and Options easier.
The purpose of this Rule is the initial exploration of the content of a table.
1. Acquire a file from the user through task_obtain_file_from_user.
2. Transform the file into a pickled Pandas DataFrame using task_convert_file_type.
3. Cleanse and analyze the file through task_data_cleansing_and_analysis_for_pandas.
4. Present the results through task_present_table_for_pandas.
5. Perform additional, more complex analyses through task_explore_data_for_pandas.", "dependencies" : [ { "symbol" : "demo_data_exploration", "weight" : 1.0, "comment_filter" : null } ], "threshold" : 1.0, "trigger" : { "repeat" : "never", "arguments" : [], "deactivate_if" : {} }, "actions" : [ { "type" : "create_option", "var" : "demo-data-exploration-stage-1", "name" : "demo-data-exploration-stage-1", "description" : null, "confidence" : 1000.0, "trigger" : { "repeat" : "never", "arguments" : [], "deactivate_if" : {} }, "display" : null, "actions" : [ { "type" : "create_tag", "var" : "task_1", "symbol" : "task_obtain_file_from_user", "comment" : null, "weight" : null, "arguments" : [], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : "require_1_1", "symbol" : "require_a_file", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_1" } ], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : null, "symbol" : "!set_status_message", "comment" : "Getting input...", "weight" : null, "arguments" : [], "mark_with" : [] }, { "type" : "create_option", "var" : "demo-data-exploration-stage-2", "name" : "demo-data-exploration-stage-2", "description" : null, "confidence" : 1000.0, "trigger" : { "repeat" : "never", "arguments" : [ { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : "task_1", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : true, "arguments" : {} }, { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : null, "created_by" 
: null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "!provide", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : { "type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : "require_1_1", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : {} }, "1" : { "type" : "file", "var" : "file_initial", "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "name_matches" : null } } } ], "deactivate_if" : { "task_1" : ["is_nullified"] } }, "display" : null, "actions" : [ { "type" : "create_tag", "var" : "task_2", "symbol" : "task_convert_file_type", "comment" : null, "weight" : null, "arguments" : [], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : "require_2_1", "symbol" : "require_format_pickled_pandas_dataframe", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_2" }, { "type" : "variable", "nullable" : false, "var" : "file_initial" } ], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : null, "symbol" : "!set_status_message", "comment" : "Converting file format...", "weight" : null, "arguments" : [], "mark_with" : [] }, { "type" : "create_option", "var" : "demo-data-exploration-stage-3-hotfix-for-file-conversion-task", "name" : 
"demo-data-exploration-stage-3-hotfix-for-file-conversion-task", "description" : "As of 2019-01-10, the Rules working on task_convert_file_type don't realize when a file doesn't need to be converted because it already has the correct filetype. That only happens when Interact_ask_user_if_they_want_file_conversion is used to create the file. This Option performs that check. Its confidence is set so high that it is practically guaranteed it will run before anything else.", "confidence" : 9999.0, "trigger" : { "repeat" : "never", "arguments" : [ { "type" : "file", "var" : "fileAlreadyIsPickle", "role" : "optional", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : "file_initial", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "name_matches" : "^.*(\\.pickle|\\.pkl)$" } ], "deactivate_if" : { "require_2_1" : ["is_nullified", "is_provided"] } }, "display" : null, "actions" : [ { "type" : "conditional", "if" : { "type" : "reference_exists", "exists" : "fileAlreadyIsPickle" }, "then" : [ { "type" : "create_tag", "var" : null, "symbol" : "!provide", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "require_2_1" }, { "type" : "variable", "nullable" : false, "var" : "file_initial" } ], "mark_with" : [] } ], "else" : [] } ] }, { "type" : "create_option", "var" : "demo-data-exploration-stage-3", "name" : "demo-data-exploration-stage-3", "description" : null, "confidence" : 1000.0, "trigger" : { "repeat" : "never", "arguments" : [ { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : "task_2", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" 
: null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : true, "arguments" : {} }, { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "!provide", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : { "type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : "require_2_1", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : {} }, "1" : { "type" : "file", "var" : "file_after_type_conversion", "role" : "required", "targeted_by" : [ { "type" : "tag", "_comment" : "If the file_after_type_conversion is also the file that was targeted by require_2_1, it means the file was not changed by task_2, task_convert_file_type", "var" : "fileIsUnchanged", "role" : "optional", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : "require_2_1", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : {} } ], 
"equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "name_matches" : null } } } ], "deactivate_if" : { "task_2" : ["is_nullified"] } }, "display" : null, "actions" : [ { "type" : "conditional", "_comment" : "If the file was changed compared to the one that was uploaded, offer the cleaned version for download.", "if" : { "type" : "not", "not" : { "type" : "reference_exists", "exists" : "fileIsUnchanged" } }, "then" : [ { "type" : "create_option", "var" : "demo-data-exploration-stage-3-offer-download", "name" : "demo-data-exploration-stage-3-offer-download", "description" : null, "confidence" : 1000.0, "trigger" : { "repeat" : "never", "arguments" : [], "deactivate_if" : {} }, "display" : null, "actions" : [ { "type" : "create_message", "var" : null, "visibility" : "all", "message_components" : [ { "type" : "downloadable_file", "scenario_history" : true, "scenario_history_title" : "The file after cleaning and file type conversion", "scenario_history_description" : null, "text" : "Download the file after cleaning and converting file types.", "file" : { "type" : "variable", "nullable" : false, "var" : "file_after_type_conversion" } } ] } ] } ], "else" : [] }, { "type" : "create_tag", "var" : "task_3", "symbol" : "task_data_cleansing_and_analysis_for_pandas", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "file_after_type_conversion" } ], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : "require_3_1", "symbol" : "require_open_ended_work", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_3" } ], "mark_with" : [] }, { "type" : "create_tag", "var" : null, "symbol" : "!set_status_message", "comment" : "Cleaning and analyzing file...", "weight" : null, "arguments" : [], "mark_with" : [] }, { "type" : "create_tag", "var" : "theFileInfoTag", "symbol" : 
"modifiable_file", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "file_after_type_conversion" }, { "type" : "variable", "nullable" : false, "var" : "task_3" } ], "mark_with" : [] }, { "type" : "create_tag", "var" : null, "symbol" : "current_file", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "theFileInfoTag" }, { "type" : "variable", "nullable" : false, "var" : "file_after_type_conversion" } ], "mark_with" : [] }, { "type" : "create_option", "var" : "demo-data-exploration-stage-4", "name" : "demo-data-exploration-stage-4", "description" : null, "confidence" : 1000.0, "trigger" : { "repeat" : "never", "arguments" : [ { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : "task_3", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : true, "arguments" : {} }, { "type" : "tag", "_comment" : "It's possible that the modifiable_file Tag gets replaced in the meantime, for example by Demo-data-exploration-import-analysis. 
So we need to make sure we have the latest version.", "var" : "theFileInfoTag", "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [ { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "current_file", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : "theFileInfoTag", "1" : "file_after_type_conversion" } } ], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "modifiable_file", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : {} }, { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "current_file", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : "theFileInfoTag", "1" : { "type" : "file", "var" : "file_after_analysis", "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, 
"name_matches" : null } } } ], "deactivate_if" : { "task_3" : ["is_nullified"] } }, "display" : null, "actions" : [ { "type" : "create_option", "var" : "demo-data-exploration-stage-4-offer-download", "name" : "demo-data-exploration-stage-4-offer-download", "description" : "Offer the analyzed file for download. This has a low confidence so that it is only offered after the visualizations pf task_present_table_for_pandas have been created and displayed.", "confidence" : 10.0, "trigger" : { "repeat" : "never", "arguments" : [], "deactivate_if" : {} }, "display" : null, "actions" : [ { "type" : "create_message", "var" : null, "visibility" : "all", "message_components" : [ { "type" : "downloadable_file", "scenario_history" : true, "scenario_history_title" : "The file after the analysis", "scenario_history_description" : null, "text" : "Download the file after the analysis.", "file" : { "type" : "variable", "nullable" : false, "var" : "file_after_analysis" } } ] } ] }, { "type" : "create_tag", "var" : "task_4", "symbol" : "task_present_table_for_pandas", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "theFileInfoTag" } ], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : null, "symbol" : "require_present_table_main_info", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_4" } ], "mark_with" : [] }, { "type" : "create_tag", "var" : null, "symbol" : "require_present_table_column_correlations_info", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_4" } ], "mark_with" : [] }, { "type" : "loop", "for" : "theColumn", "in" : { "type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "column", "comment" : null, 
"comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : "theFileInfoTag" } }, "do" : [ { "type" : "create_tag", "var" : null, "symbol" : "require_present_table_column_info", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_4" }, { "type" : "variable", "nullable" : false, "var" : "theColumn" } ], "mark_with" : [] } ] }, { "type" : "loop", "for" : "geographicInfoTag", "in" : { "type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "info_geographic_coordinate_column_pair", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : { "type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "column", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : "theFileInfoTag" } } } }, "do" : [ { "type" : "create_tag", "var" : null, "symbol" : "require_present_table_geographical_location", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_4" }, { "type" : "variable", "nullable" : false, "var" : "geographicInfoTag" } ], "mark_with" : [] } ] }, { "type" : "loop", "for" : "geographicInfoTag", "in" : { 
"type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "info_geographic_place_name", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : { "type" : "tag", "var" : null, "role" : "required", "targeted_by" : [], "equals" : null, "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" : "column", "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : null, "arguments" : { "0" : "theFileInfoTag" } } } }, "do" : [ { "type" : "create_tag", "var" : null, "symbol" : "require_present_table_geographical_location", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_4" }, { "type" : "variable", "nullable" : false, "var" : "geographicInfoTag" } ], "mark_with" : [] } ] }, { "type" : "create_tag", "var" : null, "symbol" : "!set_status_message", "comment" : "Creating visualizations...", "weight" : null, "arguments" : [], "mark_with" : [] }, { "type" : "create_option", "var" : "demo-data-exploration-stage-5", "name" : "demo-data-exploration-stage-5", "description" : null, "confidence" : 1000.0, "trigger" : { "repeat" : "never", "arguments" : [ { "type" : "tag", "var" : null, "role" : "required", "search_type" : "last", "search_postfilter" : null, "targeted_by" : [], "equals" : "task_4", "created_by" : null, "created_earlier_than" : null, "created_in_same_event_as" : null, "created_later_than" : null, "is_reserved" : null, "symbol" 
: null, "comment" : null, "comment_contains" : null, "comment_matches" : null, "weight" : null, "min_weight" : null, "max_weight" : null, "nullified" : false, "requirement_is_provided" : null, "task_is_finished" : true, "arguments" : {} } ], "deactivate_if" : { "task_4" : ["is_nullified"] } }, "display" : null, "actions" : [ { "type" : "create_tag", "var" : "task_5", "symbol" : "task_explore_data_for_pandas", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "theFileInfoTag" } ], "mark_with" : ["signal"] }, { "type" : "create_tag", "var" : "require_5_1", "symbol" : "require_open_ended_work", "comment" : null, "weight" : null, "arguments" : [ { "type" : "variable", "nullable" : false, "var" : "task_5" } ], "mark_with" : [] }, { "type" : "create_tag", "var" : null, "symbol" : "!set_status_message", "comment" : "Loading advanced analyses...", "weight" : null, "arguments" : [], "mark_with" : [] } ] } ] } ] } ] } ] } ], "existing_variables" : { "demo-data-exploration-stage-1" : { "type" : "option", "value" : null } } }
All versions of this Rule:
Version 26
Version 25 (deleted)
Version 24 (deleted)
Version 23 (deleted)
Version 22 (deleted)
Version 21 (deleted)
Version 20 (deleted)
Version 19 (deleted)
Version 18 (deleted)
Version 17 (deleted)
Version 16 (deleted)
Version 15 (deleted)
Version 14 (deleted)
Version 13 (deleted)
Version 12 (deleted)
Version 11 (deleted)
Version 10 (deleted)
Version 9 (deleted)
Version 8 (deleted)
Version 7 (deleted)
Version 6 (deleted)
Version 5 (deleted)
Version 4 (deleted)
Version 3 (deleted)
Version 2 (deleted)
Version 1 (deleted)