Commit c0fc3d6e authored by Leigh B. Stoller's avatar Leigh B. Stoller

Add a table to record node failures during start/stop run. This is so
we have a record of which nodes failed to respond during the
synchronous parts of the start and stop experiment run. The data is only
stored for now; it is not yet clear how it will be used later. The main
goal is to avoid the problems we see with plab nodes, where nodes do not
respond and start/stop runs hang and fail.
parent e7882dd8
......@@ -604,6 +604,19 @@ CREATE TABLE experiment_template_instance_bindings (
KEY pidtid (pid,eid)
) TYPE=MyISAM;
--
-- Table structure for table `experiment_template_instance_deadnodes`
--
-- Records nodes that failed to respond during a start or stop run of a
-- template instance. One row per (instance, run, node).
CREATE TABLE experiment_template_instance_deadnodes (
-- Index of the template instance the failing run belongs to.
instance_idx int(10) unsigned NOT NULL default '0',
-- Experiment index; stored for reference, not part of the primary key.
exptidx int(10) unsigned NOT NULL default '0',
-- Index of the run during which the node failed.
runidx int(10) unsigned NOT NULL default '0',
-- The node that failed to respond.
node_id varchar(32) NOT NULL default '',
-- The vname of that node; stored for reference, not part of the key.
vname varchar(32) NOT NULL default '',
-- A given node is recorded at most once per run of an instance.
PRIMARY KEY (instance_idx, runidx, node_id)
-- NOTE(review): TYPE= is the legacy spelling of ENGINE=; kept to match the
-- neighbouring tables. Confirm the target MySQL version before changing it.
) TYPE=MyISAM;
--
-- Table structure for table `experiment_template_instances`
--
......
......@@ -3703,3 +3703,14 @@ last_net_act,last_cpu_act,last_ext_act);
alter table experiment_runs add swapmod tinyint(1) NOT NULL default '0';
4.91: Add a table to store the ids of nodes that fail during an
instance (well, run).
-- Records nodes that failed to respond during a start or stop run.
-- One row per (instance, run, node).
CREATE TABLE experiment_template_instance_deadnodes (
-- Index of the template instance the failing run belongs to.
instance_idx int(10) unsigned NOT NULL default '0',
-- Experiment index; stored for reference, not part of the primary key.
exptidx int(10) unsigned NOT NULL default '0',
-- Index of the run during which the node failed.
runidx int(10) unsigned NOT NULL default '0',
-- The node that failed to respond.
node_id varchar(32) NOT NULL default '',
-- The vname of that node; stored for reference, not part of the key.
vname varchar(32) NOT NULL default '',
-- A given node is recorded at most once per run of an instance.
PRIMARY KEY (instance_idx, runidx, node_id)
) TYPE=MyISAM;
......@@ -390,3 +390,21 @@ CREATE TABLE experiment_run_bindings (
PRIMARY KEY (exptidx, runidx, name)
) TYPE=MyISAM;
#
# This table holds the names of nodes that failed to respond during a start
# or stop run. This is mostly informational at this point.
#
-- One row per node that failed to respond in a given run of an instance.
CREATE TABLE experiment_template_instance_deadnodes (
-- Backlink to the instance above.
instance_idx int(10) unsigned NOT NULL default '0',
-- The experiment index (into the current experiments table).
-- Stored for reference only; it is not part of the primary key.
exptidx int(10) unsigned NOT NULL default '0',
-- The index of the run during which the node failed.
runidx int(10) unsigned NOT NULL default '0',
-- The node that failed to respond.
node_id varchar(32) NOT NULL default '',
-- The vname of the node since that is typically more useful.
-- Stored for reference only; it is not part of the primary key.
vname varchar(32) NOT NULL default '',
-- A given node is recorded at most once per run of an instance.
PRIMARY KEY (instance_idx, runidx, node_id)
-- NOTE(review): TYPE= is the legacy spelling of ENGINE=; kept to match the
-- neighbouring tables. Confirm the target MySQL version before changing it.
) TYPE=MyISAM;
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment