ptopgen.in 63.8 KB
Newer Older
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1
#!/usr/bin/perl -w
Leigh B. Stoller's avatar
Leigh B. Stoller committed
2
3
4

#
# EMULAB-COPYRIGHT
Weibin Sun's avatar
Weibin Sun committed
5
# Copyright (c) 2000-2011 University of Utah and the Flux Group.
Leigh B. Stoller's avatar
Leigh B. Stoller committed
6
7
8
# All rights reserved.
#

9
10
use English;
use Getopt::Std;
11
use Math::BigInt;
12
use List::Util 'shuffle';
Leigh B. Stoller's avatar
Leigh B. Stoller committed
13

14
15
use lib "@prefix@/lib";
use libdb qw(TBGetSiteVar);
16
use libadminctrl;
17
18
19
20
use libptop;

my $top = libptop->Create();

21
22
my $PGENISUPPORT = @PROTOGENI_SUPPORT@;

23
24
$NO_GENI = "0";
$V_0_1 = "0.1";
25
$V_0_2 = "0.2";
26
27
$V_2 = "2";

28
29
30
31
32
33
if ($PGENISUPPORT) {
  require GeniHRN;
}

use GeniHRN;

34
35
#
# Print the command line synopsis to stdout and exit with status -1.
# Does not return.
#
sub usage()
{
    # Note: -c is the delay capacity override and -1 selects a single
    # component; -n takes "cores,edges" (comma separated), and -g accepts
    # exactly the versions checked after option parsing.
    print("Usage: ptopgen [-v] [-s switch] [-p pid [-e eid]] [-m factor] " .
	  "[-n c,e] [-x] [-g (0 | 0.1 | 0.2 | 2)] [-c delay-capacity] " .
	  "[-1 component-name] [-l type-limit-file] [-z]\n" .
	  "       -p include nodes the project has permission to use\n".
	  "       -e include given experiments resources\n" .
	  "          in the ptopfile (as if they were free)\n" .
	  "       -v Include stuff for topologies with virtual nodes\n".
	  "       -r Include stuff for topologies with widearea nodes\n".
#	  "       -s Include stuff for topologies with simulated nodes\n".
	  "       -h Include stuff for topologies with shared nodes\n".
	  "       -a Include even reserved nodes\n".
	  "       -m Override multiplex_factor\n".
	  "       -u Prune unused interfaces of allocated nodes (-e)\n".
	  "       -c Delay capacity override\n".
	  "       -n Add in modelnet core and edge node features\n".
	  "       -x Output into the new xml ptop format\n".
	  "       -g version With -x, geni version. " .
	  "Must be '0', '0.1', '0.2' or '2'\n".
	  "       -l specifies the location of the type limit file\n" .
	  "       -1 Print an rspec containing only the node component-name\n" .
	  "       -z Randomize node output order\n");
    exit(-1);
}
58

59
my $optlist = "s:e:m:vp:rSan:c:uxg:h1:l:z";
60
my $mfactor;
61
my $virtstuff = 0;
62
my $widearea  = 0;
63
my $simstuff  = 0;
64
my $allnodes  = 0;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
65
66
my $mnetcores = 0;
my $mnetedges = 0;
67
my $prune     = 0;
68
my $do_xml    = 0;
69
my $genimode  = $NO_GENI;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
70
my $useshared = 0;
71
my $component_name = undef;
72
my $randomize = 0;
73

74
my $OURDOMAIN = "@OURDOMAIN@";
75
my $MAINSITE  = @TBMAINSITE@;
76
my $cmuuid = TBGetSiteVar('protogeni/cm_uuid');
77
78
79
80
my $cmurn = "";
if ($PGENISUPPORT) {
    $cmurn = GeniHRN::Generate($OURDOMAIN, "authority", "cm");
}
81

82
my $default_long = undef;
83
TBGetSiteVar('general/default_longitude', \$default_long);
84
my $default_lat = undef;
85
TBGetSiteVar('general/default_latitude', \$default_lat);
86
my $default_country = undef;
87
TBGetSiteVar('general/default_country', \$default_country);
88

89
my $delaycap_override;
90

91
92
93
94
#
# Turn off line buffering on output
#
$| = 1;
95
96
97
98
99
100
101
102
103
104
105
106

# Settings - Change these to your particular network.

#
# Also bogus. The interfaces table does not hold entries for the switch
# side of each link. It will have to at some point, when we have something
# other than 100Mbs ports (say, gbit ports).
#
# Speed is in Kbs!
#
my $default_switchport_speed    = 100000;

107
108
109
110
111
112
#
# Yet more bogosity - we hardcode this weight, which is given to wide-area
# (primarily plab) nodes to prefer spreading across sites
#
my $site_weight = 0.99;

113
114
######################################################################

115
my $TBROOT = "@prefix@";
116
use lib '@prefix@/lib';
117
require exitonwarn;
118
use libdb;
Kevin Atkinson's avatar
Kevin Atkinson committed
119
use libtblog;
120
use Experiment;
121
use Node;
122
use NodeType;
123
use Lan;
Kevin Atkinson's avatar
Kevin Atkinson committed
124
125

tblog_stop_capture('stdout');
Leigh B. Stoller's avatar
Leigh B. Stoller committed
126

127
128
my $TRACK_INTERSWITCH_BANDWIDTH = "@TRACK_INTERSWITCH_BANDWIDTH@";

129
130
my %switches	  = ();
my %permissions   = ();
131
132
my %typemap       = ();
my %auxtypemap    = ();
Timothy Stack's avatar
   
Timothy Stack committed
133
my %areamap       = ();
134
my %globalcounts  = ();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
135
my %interfacestate= ();
136
my %vinterfaces   = ();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
137
my %rusagedata    = ();
138

139
140
141
my $DEADPID = NODEDEAD_PID();
my $DEADEID = NODEDEAD_EID();

142
my $pid;
143
my $exempt_eid;
144
my $switchtouse;
145
my $experiment;
146

147
148
my $typelimitfile = "";

149
150
sub fatal($);

151
152
153
154
155
156
157
158
159
160
161
162
163
164
#
# Parse command arguments. Once we return from getopts, all that should be
# left are the required arguments.
#
%options = ();
# Bail out with the usage message on an unknown option or on any
# leftover positional argument; this script takes options only.
usage()
    if (! getopts($optlist, \%options));
usage()
    if (@ARGV);
# -s: restrict output to a single named switch.
$switchtouse = $options{"s"}
    if (defined($options{"s"}));
165
166
167
# Simple switches and single-valued options. Each assignment is
# independent of the others; a variable keeps its default when the
# corresponding option was not given.
$mfactor           = $options{"m"} if (defined($options{"m"}));
$useshared         = 1             if (defined($options{"h"}));
$virtstuff         = 1             if (defined($options{"v"}));
$widearea          = 1             if (defined($options{"r"}));
$simstuff          = 1             if (defined($options{"S"}));
$pid               = $options{"p"} if (defined($options{"p"}));
$allnodes          = 1             if (defined($options{"a"}));
$prune             = 1             if (defined($options{"u"}));
$delaycap_override = $options{"c"} if (defined($options{"c"}));
Leigh B. Stoller's avatar
Leigh B. Stoller committed
192
193
194
195
196
197
198
199
200
# -n cores,edges: modelnet core and edge node counts.
if (defined($options{"n"})) {
    # Require the whole argument to be two integers separated by a comma.
    # An unanchored pattern with optional digits would let values such as
    # "," or "x1,2y" through and leave empty strings in the counters.
    if ($options{"n"} =~ /\A(\d+),(\d+)\z/) {
	$mnetcores = $1;
	$mnetedges = $2;
    }
    else {
	usage();
    }
}
201
# -e eid: treat the resources of experiment pid/eid as if they were free.
# Requires -p, which has already been processed at this point.
if (defined($options{"e"})) {
    if (!defined($pid)) {
	usage();
    }
    $exempt_eid = $options{"e"};
    $experiment = Experiment->Lookup($pid, $exempt_eid);
    if (!defined($experiment)) {
	die("Could not look up experiment $pid,$exempt_eid\n");
    }
}

# -x: XML output. -g is only honored together with -x, and only when
# ProtoGENI support is configured; it also turns on shared and virtual
# node handling.
if (defined($options{"x"})) {
    $do_xml = 1;
    if (defined($options{"g"}) && $PGENISUPPORT) {
	$genimode  = $options{"g"};
	$useshared = 1;
	$virtstuff = 1;
    }
}

# -l file: location of the type limit file.
$typelimitfile = $options{"l"}
    if (defined($options{"l"}));

# -1 name: restrict output to the single named component.
$component_name = $options{"1"}
    if (defined($options{"1"}));

# -z: randomize node output order.
$randomize = 1
    if (defined($options{"z"}));
226

227
# Reject inconsistent options: pruning (-u) needs an exempt experiment
# (-e), and the geni version must be one of the known version strings.
if (($prune && !defined($exempt_eid)) ||
    ($genimode ne $NO_GENI &&
     $genimode ne $V_0_1 &&
     $genimode ne $V_0_2 &&
     $genimode ne $V_2)) {
    usage();
}
233

234
235
# Names of the fake switches, and of the interfaces on them. The interface
# names differ depending on whether a geni mode was selected.
$fake_inet_switch = "internet";
$fake_air_switch  = "airswitch";
$fake_inet_iface  = ($genimode ne $NO_GENI ? "border" : "(null)");
$fake_air_iface   = ($genimode ne $NO_GENI ? "air"    : "(null)");

243
244
print_header();

245
my %nodetointerface;
246
247
my %interfaceroles = ();
my %interfacetypes = ();
248
my %interfaceips = ();
249
250

# Read interfaces
251
my $result =
252
    DBQueryFatal("SELECT node_id,card,port,iface,interface_type,role,IP" .
253
		 " from interfaces " .
254
		 ($genimode ne $NO_GENI ? "where role!='gw'" : ""));
255
		 
256
while (($node,$card,$port,$iface,$type,$role,$ip) = $result->fetchrow_array) {
257
258
259
260
261
    push @{ $nodetointerface{"$node"} }, $iface;
    $interfacemap{"$node:$card:$port"} = $iface;
    if ((defined $type) && ($type ne "")) {
	$interfacetypes{"$node:$card:$port"} = $type;
    }
262
263
264
    if ((defined $role) && ($role ne "")) {
	$interfaceroles{"$node:$iface"} = $role;
    }
265
266
267
    if ((defined $ip) && ($ip ne "")) {
	$interfaceips{"$node:$iface"} = $ip;
    }
268
269
}

270
271
272
273
my %nodetouuid;
my %nodetoavailable;

$result = DBQueryFatal("SELECT n.node_id, n.eventstate, n.role, n.uuid, " .
274
		       "nt.isremotenode, " .
275
		       "dedicated_wa_types.attrvalue, b.erole, " .
276
		       "n.reserved_pid, b.eid " .
277
278
279
280
281
282
283
284
285
286
		       "from nodes as n " .
		       "left join reserved as b on n.node_id=b.node_id " .
		       "left join node_types as nt on nt.type=n.type " .
		       "left outer join " .
		       "  (select type, attrvalue " .
		       "   from node_type_attributes " .
		       "   where attrkey='dedicated_widearea' " .
		       "   group by type) as dedicated_wa_types " .
		       "  on nt.type=dedicated_wa_types.type " .
		       "where nt.isvirtnode = 0 or nt.isvirtnode is null;");
287
#
# Record the uuid of every physical node and whether it counts as
# available, in %nodetouuid and %nodetoavailable respectively.
#
while (($node, $eventstate, $role, $uuid, $isremotenode,
	$wa_attrvalue, $erole,
	$reserved_pid, $reserved_eid) = $result->fetchrow_array) {
    $nodetouuid{$node} = $uuid
	if (defined($uuid) && $uuid ne "");

    # Local: a testnode that is not remote, or whose type carries the
    # dedicated_widearea attribute.
    my $islocal = $role eq 'testnode'
	&& ((! defined($isremotenode) || $isremotenode == 0)
	    || (defined($wa_attrvalue) && $wa_attrvalue == 1));

    # Up: in one of the event states from which a node can be allocated.
    my $isup = defined($eventstate)
	&& ($eventstate eq TBDB_NODESTATE_ISUP
	    || $eventstate eq TBDB_NODESTATE_PXEWAIT
	    || $eventstate eq TBDB_NODESTATE_POWEROFF
	    || $eventstate eq TBDB_NODESTATE_ALWAYSUP);

    # Shared: a running shared host, counted only when -h was given.
    my $isshared = (defined($erole)
		    && $erole eq "sharedhost"
		    && $useshared
		    && $isup);

    # Reserved: allocated to an experiment, or pre-reserved to a project
    # other than the one named with -p.
    my $isreserved = (defined($reserved_eid)
		      || (defined($reserved_pid)
			  && (! defined($pid) || $pid ne $reserved_pid)));

    # Non-local nodes are always marked available here.
    $nodetoavailable{$node} = (!$islocal
			       || (! $isreserved && $isup)
			       || $isshared);
}

315
# Read class/type maps
316
$result =
317
318
319
    DBQueryFatal("select class,type,isvirtnode from node_types");

while (my ($class,$type,$isvirt) = $result->fetchrow_array) {
320
321
322
    $map = {};
    $map->{'CLASS'}    = $class;
    $map->{'ISVIRT'}   = $isvirt;
323
324
325
326
327
328
329
330
331
    my $typeinfo       = NodeType->Lookup($type);
    $map->{'DELAYCAP'} = $typeinfo->delay_capacity();
    $map->{'VIRTCAP'}  = $typeinfo->virtnode_capacity();
    $map->{'SIMCAP'}   = $typeinfo->simnode_capacity();
    $map->{'SPEED'}    = $typeinfo->frequency();
    $map->{'RAM'}      = $typeinfo->memory();
    $map->{'OSID'}     = $typeinfo->default_osid();
    $map->{'IMAGEABLE'}= $typeinfo->imageable();
    $map->{'TRIVSPEED'}= $typeinfo->trivlink_maxspeed();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
332
    $map->{'SHARED'}   = $typeinfo->shared();
333
    $map->{'TYPEINFO'} = $typeinfo;
334
335
    $map->{'FEATURES'} = [];
    $map->{'AUXTYPES'} = {};
336
    $map->{'OSLIST'} = [];
337
    $typemap{$type} = $map;
338
339
340
341
342
343

    # Default is permission to use all types,classes. 
    $permissions{$class} = 1;
    $permissions{$type}  = 1;
}

Timothy Stack's avatar
   
Timothy Stack committed
344
345
# Read node_startloc
$result = DBQueryFatal("select node_id,building from node_startloc");
Timothy Stack's avatar
   
Timothy Stack committed
346
while (($node,$building) = $result->fetchrow_array) {
347
348
349
350
    # TODO: This screws up the meaning of the @features list. Now it
    # is not just a list of feature strings, but a list of strings
    # which might themselves be space-delimited lists of feature
    # strings. Fix this.
Timothy Stack's avatar
   
Timothy Stack committed
351
    $areamap{$node} .= " area-$building:0";
Timothy Stack's avatar
   
Timothy Stack committed
352
353
}

354
355
356
357
358
#
# Read the features table for each type.
# 
$result = DBQueryFatal("select type, feature, weight from node_type_features");
while (my ($type, $feature, $weight) = $result->fetchrow()) {
359
360
361
362
363
364
365
366
367
368
    push(@{$typemap{$type}->{'FEATURES'}}, "$feature:$weight");
}

#
# Read the auxtypes for each type.
# 
$result = DBQueryFatal("select auxtype,type from node_types_auxtypes");
while (my ($auxtype,$type) = $result->fetchrow()) {
    $typemap{$type}->{'AUXTYPES'}->{$auxtype} = 1;
    $auxtypemap{$auxtype} = $type;
369
370
}

371
372
373
374
375
376
377
378
379
380
381
382
#
# Read the features table for each individual node
#
$result = DBQueryFatal("select node_id, feature, weight from node_features");
while (my ($node_id, $feature, $weight) = $result->fetchrow()) {
    # The per-node list springs into existence on the first push.
    push @{$features{$node_id}}, "$feature:$weight";
}
383
384
385
386
387
388
389
390
391
#
# Read in the node_auxtypes table for each node.
#
$result = DBQueryFatal("select node_id, type, count from node_auxtypes");
while (my ($node_id, $type, $count) = $result->fetchrow()) {
    # The per-node list springs into existence on the first push.
    push @{$auxtypes{$node_id}}, "$type:$count";
}
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
#
# Read the permission table if given a pid. If there is an entry in
# the table for a type/class, then permission is granted only if there
# is a record with the pid. If not, remove the permission granted above.
# 
if (defined($pid)) {
    # Two passes over the permissions table: first revoke every type or
    # class that has any entry at all, then grant back the ones that have
    # an entry for this pid.
    my @passes = (
	["select type from nodetypeXpid_permissions", 0],
	["select type from nodetypeXpid_permissions ".
	 "where pid='$pid'", 1],
    );
    foreach my $pass (@passes) {
	my ($query, $granted) = @$pass;

	$result = DBQueryFatal($query);
	while (my ($type) = $result->fetchrow_array) {
	    $permissions{$type} = $granted;
	}
    }
}

416
417
418
419
420
421
422
#
# Read the table of which image types are supported on which hardware - we
# limit this to global images and ones that match the PID (if given) We do this
# limiting for two reasons:
# 1) To avoid an explosion in the number of features for nodes
# 2) To avoid information leaks, allowing projects to see each other's images
# 
423
my $osidquery = "select distinct o.osid, oi.type, o.osname, o.pid, o.OS, o.version, o.description,o.protogeni_export from os_info as o " .
424
425
426
427
428
429
430
	"left join osidtoimageid as oi on o.osid = oi.osid " .
	"left join images as i on oi.imageid = i.imageid ".
	"where i.global = 1";
if ($pid) {
    $osidquery .= " or i.pid='$pid'";
}

431
432
433
434
my $defaultosidquery = 'select distinct o.osid, t.type, o.osname, o.pid, o.OS, o.version, o.description, o.protogeni_export '.
    'from os_info as o left join node_type_attributes as t '.
    'on (o.osid=t.attrvalue) where t.attrkey="default_osid"';

435
436
437
438
#
# For subOS support (i.e., vnode OSes running atop vhost OSes), we have to
# check both the subosid and all the parent_osid it can run on.
#
439
my $subosidquery = "select distinct o.osid,o.parent_osid from os_submap as o " .
440
441
442
443
444
445
446
447
448
449
450
451
452
453
	"left join osidtoimageid as oi1 on o.osid = oi1.osid " .
	"left join osidtoimageid as oi2 on o.parent_osid = oi2.osid " .
	"left join images as i1 on oi1.imageid = i1.imageid ".
	"left join images as i2 on oi2.imageid = i2.imageid ".
	"where (i1.global = 1";
if ($pid) {
    $subosidquery .= " or i1.pid='$pid'";
}
$subosidquery .= ") and (i2.global = 1";
if ($pid) {
    $subosidquery .= " or i2.pid='$pid'";
}
$subosidquery .= ")";

454
455
456
457
458
459
460
461
462
463
464
465
our %node_type_osids;
our %osid_node_types;
our %osid_subosids;
our %osid_name;
our %osid_pid;
our %osid_os;
our %osid_version;
our %osid_description;
our %node_countries;
our %node_latitudes;
our %node_longitudes;

466
$result = DBQueryFatal($osidquery);
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
processOs($result);

$result = DBQueryFatal($defaultosidquery);
processOs($result);

#
# Fold the rows of an OS query into the per-type and per-OSID tables.
#
# Argument: a query result whose rows are
#   (osid, type, osname, pid, OS, version, description, protogeni_export).
#
# For each row:
#  * if the type is known in %typemap and the OS is either exported to
#    protogeni or is the default OSID of the type, the osid is appended to
#    the type's OSLIST and its descriptive fields are recorded in the
#    %osid_* tables;
#  * the osid is always appended to %node_type_osids for the type, and the
#    type to %osid_node_types for the osid.
#
sub processOs
{
    my $result = shift(@_);
    while (my ($osid,$type,$osname,$ospid,$osos,
	       $osversion,$osdescription,$geni) = $result->fetchrow()) {
	if ($typemap{$type}) {
	    my $default = $typemap{$type}->{'OSID'};
	    # The export flag may come back NULL; test for definedness first
	    # so that no uninitialized-value warning is raised.
	    if ((defined($geni) && $geni eq 1) ||
		(defined($default) && $default eq $osid)) {
		push(@{ $typemap{$type}->{'OSLIST'} }, $osid);
		$osid_name{$osid} = $osname;
		$osid_pid{$osid} = $ospid;
		$osid_os{$osid} = $osos;
		$osid_version{$osid} = $osversion;
		$osid_description{$osid} = $osdescription;
	    }
	}
	push @{$node_type_osids{$type}}, $osid;
	#
	# We have to maintain a data structure telling us which types an OSID
	# could be on for use below with generic OSIDs
	#
	push @{$osid_node_types{$osid}}, $type;
    }
}
505
506
507
508
509
510
511
512
513
514
515
#
# XXX Note below that for now, subosids cannot redirect to other subosids.
#
$result = DBQueryFatal($subosidquery);
while (my ($subosid,$osid) = $result->fetchrow()) {
    # Map each parent OSID to the list of sub-OSIDs that can run on it.
    push @{$osid_subosids{$osid}}, $subosid;
}
516
517
518
519
520

#
# We also have to resolve the 'generic' OSIDs, which use the nextosid field to
# redirect to another OSID
#
521
$result = DBQueryFatal("select osid from os_info where " .
522
    "nextosid is not null");
523
while (my ($osid) = $result->fetchrow()) {
524
525
526
    #
    # Check to see if they were allowed to use the real OSID
    #
527
    my $realosid = TBResolveNextOSID($osid, $pid, $exempt_eid);
528
529
    if ($osid_node_types{$realosid}) {
	foreach my $type (@{$osid_node_types{$realosid}}) {
530
531
532
533
534
	    push @{$node_type_osids{$type}}, $osid;
	}
    }
}

535
# Print switches
536
if (defined($switchtouse) && ! defined($component_name)) {
537
538
539
    # Should probably get the last four args out of the database, but I don't
    # think we ever actually use this case...
    print_switch($switchtouse,undef,undef,undef,undef);
540
541
    $switches{$switchtouse} = 1;
}
542
elsif (! defined($component_name)) {
543
    $result =
544
545
546
547
548
549
550
551
	DBQueryFatal("select n.node_id,n.uuid,country,latitude,longitude ".
                     "   from nodes as n ".
		     "left join widearea_nodeinfo as wn ".
                     "     on n.node_id=wn.node_id " .
		     "left join node_types as nt on ".
		     "     nt.type=n.type ".
		     "where role='testswitch' or role='widearea_switch' or ".
		     "      (role='testnodefoo' and nt.isswitch=1)");
552

553
554
555
    while (($switch, $uuid, $country, $latitude, $longitude) =
            $result->fetchrow_array) {
	print_switch($switch, $uuid, $country, $latitude, $longitude);
556
557
	$switches{$switch} = 1;
    }
558
}
559

560
561
562
563
564
565
#
# Get the global counts.
#
$result =
    DBQueryFatal("select phys_nodeid,count(phys_nodeid) from reserved as r ".
		 "left join nodes as n on n.node_id=r.node_id ".
566
567
568
569
		 "where n.node_id!=n.phys_nodeid ".
		 (defined($exempt_eid) ?
		  "and not (pid='$pid' and eid='$exempt_eid') " : " ") .
		 "group by phys_nodeid");
570
571
572
573
while (my ($node_id,$count) = $result->fetchrow_array) {
    $globalcounts{$node_id} = $count;
}

574
# Find available nodes.
575
#
576
577
# This first query deals with just local nodes. Local nodes can host
# virtnodes, according to the delay_capacity in the types table. 
578
#
579

580
# the ordinary free condition for a local node.
581
582
my $free_condition = "(b.node_id is null and ".
                     " (np.eventstate='" . TBDB_NODESTATE_ISUP . "' or ".
583
                     "  np.eventstate='" . TBDB_NODESTATE_PXEWAIT . "' or ".
584
                     "  np.eventstate='" . TBDB_NODESTATE_POWEROFF . "' or ".
585
                     "  np.eventstate='" . TBDB_NODESTATE_ALWAYSUP . "')) ";
586

587
588
589
590
591
if (defined($pid)) {
    $free_condition = "($free_condition and ".
	"(np.reserved_pid is null or np.reserved_pid='$pid'))";
}

592
593
594
595
# if the user has specified an exempt pid/eid, 
# then view any node which is reserved to that experiment as available.
if (defined($exempt_eid)) {
    $free_condition = "($free_condition or ".
596
	"(b.pid='$pid' and b.eid='$exempt_eid'))"; 
597
}
Chad Barb's avatar
Chad Barb committed
598

599
600
601
# In shared mode, allow allocated nodes whose sharing_mode is set.
if ($useshared) {
    # Also accept allocated nodes acting as shared hosts, provided they
    # are up. Uses the standard SQL "and" (like the other fragments of
    # this condition) rather than the MySQL-specific "&&" synonym.
    $free_condition = "($free_condition or ".
	"(b.node_id is not null and b.erole='sharedhost' and ".
	" np.eventstate='" . TBDB_NODESTATE_ISUP . "'))";
}

606
607
608
609
610
611
# If the user wants all nodes, we consider everything to be free (this
# overrides the other possible free conditions).
if ($allnodes) {
    $free_condition = "1";
}

612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
# By default, include no wide area nodes when setting up the data structures.
#$free_condition = "($free_condition and ".
#    "(t.isremotenode=0 or ".
#    "dedicated_wa_types.attrvalue=1))";

# But if they have asked for widearea, we want this prepass to include
# these nodes.
#if ($widearea) {
#    $free_condition = "($free_condition or ".
#	"(t.isremotenode=1 and ".
#	"t.isvirtnode=0 and t.type!='pcfedphys' and ".
#	"dedicated_wa_types.attrvalue is NULL))";
#}


627
# In genimode exclude nodes with exclusion attribute.
628
if ($genimode ne $NO_GENI) {
629
630
631
632
    $free_condition = "($free_condition and ".
	"(nat1.attrvalue is null or nat1.attrvalue=0))";
}

633
634
635
636
if (defined($component_name)) {
    $free_condition = "(a.node_id = \"$component_name\")";
}

637
$result =
638
    DBQueryFatal("select a.node_id,a.type,a.phys_nodeid,t.class,t.issubnode," .
Leigh B. Stoller's avatar
Leigh B. Stoller committed
639
		 "a.def_boot_osid,(b.pid is not null and b.eid is not null), ".
640
		 "  np.reserved_pid is not null,np.eventstate, ".
Leigh B. Stoller's avatar
Leigh B. Stoller committed
641
642
		 "  np.battery_percentage,np.uuid,b.sharing_mode, ".
		 "  ru.load_1min, ru.load_5min, ru.status_timestamp, ".
643
		 "  a.def_boot_osid, nat2.attrvalue, wn.country, " .
644
                 "  wn.latitude, wn.longitude, t.isremotenode ".
645
		 "from nodes as a ".
646
647
		 "left join reserved as b on a.node_id=b.node_id ".
		 "left join reserved as m on a.phys_nodeid=m.node_id ".
648
		 "left join nodes as np on a.phys_nodeid=np.node_id ".
649
		 "left join node_types as t on t.type=a.type ".
650
651
652
653
654
655
		 "left join node_attributes as nat1 on ".
		 "     nat1.node_id=a.node_id and ".
		 "     nat1.attrkey='protogeni_exclude' ".
		 "left join node_attributes as nat2 on ".
		 "     nat2.node_id=a.node_id and ".
		 "     nat2.attrkey='shared_weight' ".
Leigh B. Stoller's avatar
Leigh B. Stoller committed
656
		 "left join node_rusage as ru on ru.node_id=a.node_id ".
657
658
659
660
661
662
		 "left outer join ". 
		 "  (select type,attrvalue ".
		 "   from node_type_attributes ".
		 "   where attrkey='dedicated_widearea' ".
		 "   group by type) as dedicated_wa_types ".
		 "  on t.type=dedicated_wa_types.type ".
663
                 "left join widearea_nodeinfo as wn on a.node_id=wn.node_id ".
664
		 "where $free_condition and ".
665
666
667
#		 "      a.role='testnode'"
		 "   (a.role='testnode' and (t.isremotenode=0 or ".
		 "                           dedicated_wa_types.attrvalue=1))");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
668

669
670
671
#
# Scan the results, checking permissions and adding to the list
# You get to use a node type if no pid was specified (that is, you get
672
673
674
# to use all nodes), or if there is no entry in the perms table for
# the type/class of node.
#
Timothy Stack's avatar
   
Timothy Stack committed
675
while (($node,$type,$physnode,$class,$issubnode,$def_boot_osid,$reserved,
Leigh B. Stoller's avatar
Leigh B. Stoller committed
676
	$prereserved,$eventstate,$battery_perc,$uuid,$sharing_mode,
677
	$load_1min,$load_5min,$load_tstamp,$osid,$weight,$country,$latitude,
678
679
680
681
682
683
684
685
        $longitude,$isremote) = $result->fetchrow_array) {
    my $current = $top->CreateNode($node);
    $current->SetSubnode($physnode, $issubnode);
    $current->SetRemote($isremote);

#    next
#	if ($isremote);

686
687
688
    $nodes{$node} = $type
	if (!defined($pid) ||
	    ($permissions{$type} && $permissions{$class}));
689
    $node_def_boot_osid{$node} = $def_boot_osid;
690
691
692
693
694
695

    if ($reserved) {
	$is_reserved{$node} = 1;
    } else {
	$is_reserved{$node} = 0;
    }
696
    if ($useshared && $sharing_mode) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
697
698
699
	$sharing_mode{$node} = { "load_1min"   => $load_1min,
				 "load_5min"   => $load_5min,
				 "load_tstamp" => $load_tstamp,
700
701
				 "osid"        => $osid,
				 "weight"      => $weight};
Leigh B. Stoller's avatar
Leigh B. Stoller committed
702
703
704
705
    }
    else {
	$sharing_mode{$node} = 0;
    }
Timothy Stack's avatar
   
Timothy Stack committed
706
707

    $is_prereserved{$node} = $prereserved;
708
709
710

    $curr_state{$node} = $eventstate;
    $curr_batt{$node} = $battery_perc;
711
712
713
714

    $node_countries{$node} = $country;
    $node_latitudes{$node} = $latitude;
    $node_longitudes{$node} = $longitude;
715
}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
716

717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
#
# Find out which nodes are connected to which, so that we can add some special
# features
#
$result = DBQueryFatal("SELECT DISTINCT node_id1, node_id2 " .
                       "  FROM wires");
# Undirected adjacency: $connections{$a} lists every node wired to $a,
# each neighbor appearing once.
my %connections = ();
while (my ($node_id1, $node_id2) = $result->fetchrow()) {
    # Record the wire in both directions.
    foreach my $pair ([$node_id1, $node_id2], [$node_id2, $node_id1]) {
        my ($node1, $node2) = @$pair;
        if ($connections{$node1}) {
            # Check to see if we've already added this one (possible if the
            # nodes appeared in node1,node2 order, then node2,node1).
            # Compare as plain strings: the node id must not be treated
            # as a regular expression.
            if (!grep { $_ eq $node2 } @{$connections{$node1}}) {
                push @{$connections{$node1}}, $node2;
            }
        } else {
            $connections{$node1} = [$node2];
        }
    }
}

739
740
741
742
743
744
# Node names in the order they will be printed: the hash's key order, or a
# shuffled copy of it when $randomize is true.
@nodenames = $randomize ? shuffle(keys(%nodes)) : keys(%nodes);

745
746
747
#
# Loop through and print out all nodes
#
748
foreach $node (@nodenames) {
749
750
751
752
753
754
    my $current = $top->nodes()->{$node};

    # Wide area nodes are handled below
#    next
#	if ($current->is_remote());

755
756
757
    my $type  = $nodes{$node};
    my $class = $typemap{$type}->{'CLASS'};
    my $delay_capacity = $typemap{$type}->{'DELAYCAP'};
758
    my $simnode_capacity = $typemap{$type}->{'SIMCAP'};
759
760
    my $cpu_speed = $typemap{$type}->{'SPEED'};
    my $ram = $typemap{$type}->{'RAM'};
761
    my $trivspeed = $typemap{$type}->{'TRIVSPEED'};
762
    my $uuid = $nodetouuid{$node};
763
    
764
    my @types = ("$type:1");
765
    my @features = ();
766
    my @flags;
767
    my $needvirtgoo = 0;
768

769
770
    my ($latitude, $longitude, $country);

771
772
773
774
775
    # XXX temporary hack until node reboot avoidance 
    # is available. Nodes running the FBSD-NSE image
    # will have a feature def-osid-fbsd-nse 0.0
    # This is used by assign to prefer these pnodes
    # first before using others.
776
777
    if($node_def_boot_osid{$node} && ($node_def_boot_osid{$node} eq 
	TBOSID(TB_OPSPID, "FBSD-NSE"))) { 
778
779
780
	push(@features, "FBSD-NSE:0.0");
    }

781
782
783
784
785
786
787
788
789
    #
    # XXX: Temporary hack - don't mark switches that are testnodes
    # as having class 'switch' - assign treats those specially. We
    # use the knowledge that 'real' switches don't hit this point!
    #
    # Replacing the class with the node's own type makes the
    # "$type ne $class" test that follows false, so no separate
    # class entry is added to @types for such a node.
    #
    if ($class eq "switch") {
	$class = $type;
    }
        
790
    # Might be equal, which assign would sum as two, not one!
791
792
    if ($type ne $class) {
	push(@types, "$class:1");
793
794
    }

795
    if (defined($delay_capacity) && $delay_capacity > 0) {
796
797
798
799
800
801
	# Comes from the NS file;
	$delay_capacity = $delaycap_override
	    if (defined($delaycap_override) &&
		$delaycap_override > 0 &&
		$delaycap_override < $delay_capacity);
	
802
	push @types, "delay:$delay_capacity";
803
	push @types, "delay-${type}:$delay_capacity";
804
    }
805

Leigh B. Stoller's avatar
Leigh B. Stoller committed
806
807
808
809
810
811
812
813
814
815
    #
    # Prototype shared mode.
    #
    if ($sharing_mode{$node}) {
	#
	# Add a feature that says this node should not be picked
	# unless the corresponding desire is in the vtop. This
	# allows the node to be picked, subject to other type constraints.
	#
	push(@features, "pcshared:1.0");
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860

	#
	# The pool daemon may override the share weight.
	# When a weight is recorded in this node's sharing_mode entry it is
	# emitted verbatim as the "shareweight" feature.
	#
	if (defined($sharing_mode{$node}->{"weight"})) {
	    my $weight = $sharing_mode{$node}->{"weight"};
	    
	    push(@features, "shareweight:$weight");
	}
	else {
	    #
	    # The point of this feature is to have assign favor shared nodes
	    # that already have nodes on them, so that they are well packed.
	    # Shared nodes with just a few vnodes on them are avoided so that
	    # they will free up eventually.
	    #
	    # NOTE(review): the push at the end of this branch is commented
	    # out, so the weight computed here is never emitted and this
	    # branch currently adds no feature. Confirm whether that is
	    # intentional before re-enabling or deleting it.
	    #
	    # $maxvnodes defaults to 10 and is replaced by the count of the
	    # node's "pcvm" auxtype entry when there is one; $gcount is the
	    # node's entry in %globalcounts, or 0 when it has none.
	    #
	    my $maxvnodes = 10;
	    my $weight    = 0.5;
	    my $gcount    = $globalcounts{$node} || 0.0;

	    foreach my $auxinfo (@{$auxtypes{$node}}) {
		# Each auxtypes entry is a "type:count" string.
		my ($auxtype,$count) = split(":", $auxinfo);
		
		if ($auxtype eq "pcvm") {
		    $maxvnodes = $count;
		    last;
		}
	    }
	    #
	    # No point in the feature if no room left.
	    #
	    if ($maxvnodes > $gcount) {
		# Fraction of the vnode capacity already in use: under 25%
		# gives weight 0.8, over 75% gives 0.1, anything else 0.3.
		my $factor = ($gcount / $maxvnodes);
		if ($factor < 0.25) {
		    $weight = 0.8;
		}
		elsif ($factor > 0.75) {
		    $weight = 0.1;
		}
		else {
		    $weight = 0.3;
		}
		#push(@features, "shareweight:$weight");
	    }
	}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
861
862
    }

863
864
865
    #
    # Add any auxiliary types
    #
866
867
868
    foreach my $auxinfo (@{$auxtypes{$node}}) {
	my ($auxtype,$count) = split(":", $auxinfo);
	my $realtype;
869

870
871
872
	# Map an auxtype back to its real type, unless it is a real type.
	if (defined($auxtypemap{$auxtype})) {
	    $realtype = $auxtypemap{$auxtype};
873
874
	}
	else {
875
	    $realtype = $auxtype;
876
	}
877
878
879
880

	if ($typemap{$realtype}->{'ISVIRT'} && $count > 0) {
	    next
		if (! $virtstuff);
881
882
883
884
885
886
887

	    #
	    # If the node is shared, must subtract the current global count
	    # from the max first, to see if there is any room left.
	    #
	    if ($sharing_mode{$node} && exists($globalcounts{$node})) {
		$count -= $globalcounts{$node};
888
	    }
889
890
	    if (defined($mfactor) && $mfactor <= $count) {
		$count = $mfactor;
891
	    }
892
	    $auxinfo = "$auxtype:$count";
893
	    $needvirtgoo = 1;
894
895
896
897
898
899
900
901
902
903
904

	    #
	    # Add in machine specific auxtypes that use the same count.
	    #
	    push(@types, "${type}-vm:$count");

	    # And a legacy type.
	    my $legacy_type = $type;
	    if (($legacy_type =~ s/pc/pcvm/)) {
		push(@types, "${legacy_type}:$count");
	    }
905
906
907
908
	}
	push(@types, $auxinfo);
    }

Timothy Stack's avatar
   
Timothy Stack committed
909
    if (defined($areamap{$node})) {
Timothy Stack's avatar
   
Timothy Stack committed
910
	push @features, $areamap{$node};
Timothy Stack's avatar
   
Timothy Stack committed
911
912
    }

913
    my $cpu_ram_features_present = 0;
914
915
916
917
    #
    # This stuff is extra goo for local virtual nodes.
    # 
    if ($needvirtgoo) {
918
	push @types, "*lan:*";
919
920
921
922
	# Add trivial bw spec., but only if the node type has it
	if ($trivspeed) {
	    push @flags, "trivial_bw:$trivspeed";
	}
923
924
925
926
927
928
	if (! $sharing_mode{$node}) {
	    # Add CPU and RAM information
	    $cpu_ram_features_present++;
	    # This number can be use for fine-tuning packing
	    push @features, "?+virtpercent:100";
	}
929
	# Put this silly feature in so that we can try to keep vnodes
930
931
932
933
	# on the same pnode they were before - but only if updating
        if ($exempt_eid) {
            push @features, "${node}:0.0";
        }
934
935
    }

936
    if ($simstuff && defined($simnode_capacity) && $simnode_capacity > 0) {
937
938
939
940
941
942
943
944
945
	#
	# Advertise the "sim" type. The count is the user specified
	# multiplex factor when one is defined and it does not exceed the
	# node type's SIMCAP; otherwise it is SIMCAP itself.
	#
	my $simcount = (defined($mfactor) && $mfactor <= $simnode_capacity)
	    ? $mfactor
	    : $simnode_capacity;
	push @types, "sim:$simcount";
946
	# Add CPU and RAM information
947
	$cpu_ram_features_present++;
948
949
950
951
	push @types, "*lan:*";
	# Add trivial bw spec.
	push @flags, "trivial_bw:100000";
    }
952
953
    if ($cpu_ram_features_present) {
	# Add CPU and RAM information
954
955
956
957
	push @features, "?+cpu:$cpu_speed"
	    if (defined($cpu_speed));
	push @features, "?+ram:$ram"
	    if (defined($ram));
958
959
	push @features, "?+cpupercent:92"; # XXX Hack
	push @features, "?+rampercent:80"; # XXX Hack
960
    }
961

962
    # Add features
963
964
965
966
967
    if (! $sharing_mode{$node}) {
	push(@features, @{$typemap{$type}->{'FEATURES'}});
	if (defined($features{$node})) {
	    push @features, @{$features{$node}};
	}
968
969
    }

970
    #
Leigh B. Stoller's avatar
Leigh B. Stoller committed
971
    # Add in OS features.
972
    #
Leigh B. Stoller's avatar
Leigh B. Stoller committed
973
974
975
976
977
978
979
980
    if ($sharing_mode{$node}) {
	#
	# A shared node is running just one OS, and we put that in
	# so that the user can specify which of the current VM types
	# is wanted.
	#
	my $osid = $sharing_mode{$node}->{'osid'};
	push(@features, "OS-$osid:0.5");
981
982
983
984
	# Add any subOSes the shared node osid can support
	if (defined($osid_subosids{$osid})) {
	    push (@features, map "OS-$osid-$_:0", @{$osid_subosids{$osid}});
	}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
985
986
987
988
989
990
    }
    elsif ($node_type_osids{$type}) {
	#
	# Add in features for all of the OSes that this node (as
	# evidenced by its type) can support
	#
991
992
993
994
995
996
	foreach my $o1 (@{$node_type_osids{$type}}) {
	    push @features, "OS-$o1:0";
	    foreach my $o2 (@{$osid_subosids{$o1}}) {
		push @features, "OS-$o1-$o2:0";
	    }
	}
997
    }
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
    elsif (! $typemap{$type}->{'IMAGEABLE'} &&
	   defined($typemap{$type}->{'OSID'})) {
	#
	# If node is not imageable (and thus no entries in osidtoimageid,
	# then assume it always has its default OSID loaded and ready to
	# go, so that assign will agree to the allocation (assign_wrapper
	# adds a desire that says it has to be running the OSID the user
	# has selected, or the default OSID from the node_types table).
	#
	push @features, map "OS-$_:0", $typemap{$type}->{'OSID'};
    }
1009

1010
    # Add features indicating what this node has connections to
1011
    if ($connections{$node} && !$sharing_mode{$node}) {
1012
1013
1014
1015
1016
1017
        my @connected_to  = @{$connections{$node}};
        foreach my $other_end (@connected_to) {
            push(@features,"connected-to-$other_end:0.0");
        }
    }

1018
1019
    # This is for the case that we are modifying an existing experiment - tell
    # assign to prefer nodes the user has already allocated
1020
    if ($exempt_eid && !$allnodes && $is_reserved{$node}) {
1021
1022
1023
	push(@features,"already_reserved:0");
    }

Timothy Stack's avatar
   
Timothy Stack committed
1024
1025
1026
1027
    if ($is_prereserved{$node}) {
	push(@features,"prereserved:0.9");
    }

1028
1029
1030
1031
1032
1033
1034
1035
1036
    # Robot preferences: favor ones that are already powered on and/or
    # won't need to be recharged soon. A node whose recorded state is
    # POWEROFF gets a "poweroff" feature, and any node with a recorded
    # battery percentage gets a "powerneeded" feature whose weight is the
    # missing fraction of charge (1.0 - percent/100).
    my $robot_state = $curr_state{$node};
    push(@features,"poweroff:0.9")
	if (defined($robot_state) && ($robot_state eq TBDB_NODESTATE_POWEROFF));

    my $battery = $curr_batt{$node};
    push(@features,"powerneeded:" . (1.0 - $battery / 100.0))
	if (defined($battery));

1037
1038
1039
    #
    # Handle subnodes
    #
1040
    if ($current->is_subnode()) {
1041
1042
	# We don't want to include subnodes unless their parent node is going
	# to be in the ptop file too
1043
1044
	if (!$nodes{$current->subnode_of()} ||
	    $sharing_mode{$current->subnode_of()}) {
1045
1046
1047
1048
	    # In fact, nuke it from %nodes so that we don't include its links,
	    # either
	    delete $nodes{$node};
	    next;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1049
	}
1050
	# Push the subnode's information into its flags
1051
	push @flags, "subnode_of:" . $current->subnode_of();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1052
    }
1053

1054
1055
1056
1057
1058
1059
1060
    #
    # Handle node locations
    #
    $country = $node_countries{$node};
    $latitude = $node_latitudes{$node};
    $longitude = $node_longitudes{$node};

1061
    my @parse_features = split(" ", join(" ", @features));
1062
    print_node($node, \@types, \@parse_features, \@flags, $uuid,
1063
1064
	       $nodetointerface{$node}, $country, $latitude, $longitude,
	       $type);
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1065
1066
}

1067
my @inet_protos = ("ipv4");
1068
if (($widearea && ! defined($component_name)) || $genimode ne $NO_GENI) {
1069
1070
1071
1072
1073
1074
1075
1076
    #
    # Set up 'the Internet' as a fake switch that all widearea nodes can
    # talk to.
    # Some day, it may make sense to connect control net ports to this
    # switch.
    #
    my @types = map("*$_:*", @inet_protos);
    print_node($fake_inet_switch, \@types, [], [], undef, [], undef, undef,
1077
        undef, undef);
1078
1079
}

1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
#
# Widearea Nodes. Includes plab nodes. Note that widearea nodes are never
# allocated directly (they are in a holding experiment), but assign deals
# with it by allocating multiple vnodes on a pnode.
#
# The underlying physnode has to be "up", as determined by the
# autostatus stuff; this will prevent us from allocating a dead
# virtual node to an experiment.  This is especially hacky. We need
# another mechanism for this. We only add virtnodes when assign says
# we need them. This reduces the problem size for assign.
#
1091
1092
1093
1094
# The types we lay out are only those in the auxtypes table for the node,
# since that is where we define what vtypes are hosted on a particular
# physnode. 
#
1095
if ($widearea && ! defined($component_name)) {
1096
1097
    #
    # Note - there is currently an assumption in this query that widearea nodes
1098
    # have only one control interface.
1099
    #
1100
    $result =
1101
	DBQueryFatal("select n.node_id,nt.type,ns.status,r.pid,r.eid,wn.site,".
1102
                     "wn.country,wn.latitude,wn.longitude, ".
1103
                     "i.iface,wn.bwlimit,n.uuid ".
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1104
1105
1106
1107
		     "from nodes as n ".
		     "left join node_types as nt on nt.type=n.type ".
		     "left join reserved as r on r.node_id=n.node_id ".
		     "left join node_status as ns on ns.node_id=n.node_id ".
1108
		     "left join widearea_nodeinfo as wn on ".
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1109
		     "     wn.node_id=n.node_id ".
1110
		     "left join interfaces as i on ".
1111
		     "     n.node_id=i.node_id and ".
1112
1113
1114
1115
1116
1117
1118
		     "     i.role='" . TBDB_IFACEROLE_CONTROL() . "' ".
		     "left outer join ". 
		     "  (select type,attrvalue ".
		     "   from node_type_attributes ".
		     "   where attrkey='dedicated_widearea' ".
		     "   group by type) as dedicated_wa_types ".
		     "  on nt.type=dedicated_wa_types.type ".
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1119
		     "where  (n.role='testnode' and nt.isremotenode=1 and ".
1120
		     "        nt.isvirtnode=0 and nt.type!='pcfedphys' and ".
1121
		     "        dedicated_wa_types.attrvalue is NULL)");
1122
    
1123
1124
    while (($physnode,$ptype,$status,$mpid,$meid,$site,$country,$latitude,
            $longitude,$iface,$bwlimit,$uuid)
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1125
	   = $result->fetchrow_array) {