assign_wrapper.in 73.6 KB
Newer Older
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1
2
#!/usr/bin/perl -w

Leigh B. Stoller's avatar
Leigh B. Stoller committed
3
4
#
# EMULAB-COPYRIGHT
Leigh B. Stoller's avatar
Leigh B. Stoller committed
5
# Copyright (c) 2000-2003 University of Utah and the Flux Group.
Leigh B. Stoller's avatar
Leigh B. Stoller committed
6
7
8
# All rights reserved.
#

Leigh B. Stoller's avatar
Leigh B. Stoller committed
9
10
11
12
13
14
15
16
17
18
19
20
21
22
# This functions as the main assign loop.  It converts the virtual
# topology into a top input including LAN and delay translation.  It
# then snapshots the current testbed physical state and runs assign,
# looping a couple times if assign fails.  When assign successfully
# completes it will interpret the results.  Attempt to match any
# existing portmap entries and then update the delays and vlans table.

# Syntax: assign_wrapper <pid> <eid>

# Caveats:
#  The support for direct and interswitch links has not been tested much.

# Settings
# delaythresh is the delay in ms at or above which a delay node is needed.
23
#  (Note that the DB represents delays as floating point numbers)
Leigh B. Stoller's avatar
Leigh B. Stoller committed
24
# maxrun is maximum number of times we run assign.
25
26
# delaywithswitch if 1 will use the switch to delay when possible.  Currently
#  this only works for 10mbit links.
27
$delaythresh = 2;
28
$maxrun = 20;
29
$delaywithswitch=0;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
30

31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
#
# Some handy constants. Speed in Mbits/sec and Kbits/sec units.
# The conversion routine is to make explicit that we operate with two
# different sets of units. One is the topology, which is in Kbps now.
# The second is the physical description, which has been changed to
# Kbps in the DB (and in ptopgen).
#
# It's probably a good idea to leave portbw (current_speed) in Mbs, since
# those numbers are used at the switch and the interfaces, which really
# only think in Mbps.
#
my $S10Mbs  = 10;
my $S100Mbs = 100;
my $S10Kbs  = 10000;
my $S100Kbs = 100000;
#
# BWConvert(bw): translate a bandwidth from topology units into the units
# of the physical description. Both are expressed in Kbps at present, so
# the argument is handed back untouched.
#
sub BWConvert($) {
    my ($kbps) = @_;

    #
    # If the physical units ever go back to Mbs (as they used to be),
    # scale here instead:
    #
    #return $kbps / 1000;

    return $kbps;
}

56
$DELAYCAPACITY = @DELAYCAPACITY@;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
57
$TBROOT = "@prefix@";
58
$ENV{'PATH'} = "/usr/bin:$TBROOT/libexec:$TBROOT/sbin:$TBROOT/bin";
59

60
61
use lib '@prefix@/lib';
use libdb;
62
use libtestbed;
63
require exitonwarn;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
64

65
66
67
68
69
#
# Turn off line buffering on output
#
$| = 1;

70
71
use Getopt::Std;

Chad Barb's avatar
   
Chad Barb committed
72
getopts('vu',\%opt);
73
74
75
76

#
# Print the command line synopsis and the meaning of each option, then
# exit with a failure status. Does not return.
#
sub usage {
	# The synopsis lists both options accepted by getopts('vu').
	print "Usage: $0 [-v] [-u] pid eid\n";
	print "		-v enables verbose output\n";
	print "         -u enables update functionality\n";
	exit(-1);
}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
80

81
my $verbose = 0;
Chad Barb's avatar
   
Chad Barb committed
82
83
my $updating = 0;

84
if ($opt{v}) {
Chad Barb's avatar
   
Chad Barb committed
85
86
87
88
89
    $verbose = 1;
}

if ($opt{u}) {
    $updating = 1;
90
91
92
}

if (@ARGV != 2) {
Chad Barb's avatar
   
Chad Barb committed
93
    usage();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
94
}
95

Leigh B. Stoller's avatar
Leigh B. Stoller committed
96
97
98
99
100
101
102
103
104
105
($pid,$eid) = @ARGV;

$ptopfile = "$pid-$eid-$$.ptop";

#
# Debugging print: emit the first argument, but only when $verbose is set.
#
sub printdb {
    print $_[0]
	if ($verbose);
};

106
107
TBDebugTimeStamp("assign_wrapper started");

Leigh B. Stoller's avatar
Leigh B. Stoller committed
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
######################################################################
# Step 1 - Setup virtual topology
#
# Here we need to read the virtual topology in from the virt_nodes
# and virt_lans table.  We then need to add delay and lan nodes as
# necessary.
#
# Conversion details:
#   Let L be a LAN with N members.
#   If N == 2 
#      Let N1 be node 1
#      Let N2 be node 2
#      If L is delayed
#         Generate delay node D
#         Link N1 to D
#         Link N2 to D
#      Else
#         Link N1 to N2
#   Else
#      Generate lan node A
#      If L is delayed
#        Foreach node N in L
#           Generate delay node DN
#           Link A to DN
#           Link N to DN
#      Else
#        Foreach node N in L
#           Link N to A
#
# Datastructures:
#  nodes is indexed by virtual node and contains the node type.
139
140
#  isremotenode is indexed by virtual node and says whether the node is
#    remote. We let wanassign deal with those nodes.
Leigh B. Stoller's avatar
Leigh B. Stoller committed
141
142
143
144
#  nodelans is indexed by virtual node and contains a list of
#    <port>:<lan> that it is connected to.
#  ips is indexed by nodeport and contains the IP addresses.
#  lannodes is indexed by physical name and is the set of lan nodes.
145
#  portbw is indexed by virtual nodeport and contains the bandwidth
146
147
148
149
#    of that port. Note that port bandwidth in the interfaces table is
#    left in Mbps units for now. Thats inconsistent, I know. For LANs with
#    other bandwidths the port speed will be 100 and a delay node will
#    be inserted.
150
151
#  fixed_nodes is indexed by virtual node name and points to physical node
#   name.
Christopher Alfeld's avatar
Christopher Alfeld committed
152
#  vtypes is indexed by vtype name and is a list of {weight types}.
Leigh B. Stoller's avatar
Leigh B. Stoller committed
153
154
155
156
157
158
159
160
161
#
# Delay node names:
#  delay nodes are named tbdelayXX for N > 2
#   and tbsdelayXX for N == 2.
# 
# Lan node names:
#  lan nodes are named lan/<virtual lan>
######################################################################

162
163
164
printdb "Generating TOP file.\n";
TBDebugTimeStamp("top started");

Leigh B. Stoller's avatar
Leigh B. Stoller committed
165
166
167
168
169
170
171
172
173
174
# Shark Hack
# For each LAN we replace all the sharks in the LAN with a single
# shark shelf node.  After this goes through assign we pull them
# all back out.
#
# sharkshelves is indexed by virtual shelf name and is a list of
# the virtual nodes in it.
# sharkshelfid is used to generate ids for shark shelves.
$sharkshelfid = 0;

175
# lans is indexed by virtual lan and is a list of nodeport members.
176
177
178
# emulated is 1 if the link/lan is emulated (virtual). This is
# controlled by a variable in the virt_lans table. It also gets
# set when one of the nodes in the lan is a virtnode (jail).
179
180
181
my %lans     = ();
my %emulated = ();

182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
# delayinfo stores the virt_lans info, and is indexed by virtual
# lan:node:port and is a list of delay, bandwidth, lossrate, rdelay,
# rbandwidth, rlossrate.  Where r* indicates switch->node and the
# others indicate node->switch.
my %delayinfo = ();

# queueinfo overlaps with delayinfo. It came later, and I added before
# I understood this stuff. It should be merged into delayinfo above.
# It holds the q_ stuff from virt_lans. 
my %queueinfo = ();

# delaylinks stores the actual link delay info, converted from the
# virt delay params above. It is indexed by link name and contains
# [delay,bw,loss] for each direction. 
my %delaylinks = ();

# delaynodes stores the names of delaynodes that we create on the
# fly using delayid. This is useful for doing isdelay? tests.
my %delaynodes = ();
my $delayid    = 0;

# nodedelays and linkdelays are the final (!) representation. Indexed by
# integer id, they store the physical node info and the delay info. 
my %nodedelays = ();
my %linkdelays = ();

# Set this when forcing linkdelays instead of delay nodes. Set in the NS
# file with a tb-compat directive. The force directive says to set up a
# link delay, even when no delay would otherwise be inserted. 
my $uselinkdelays   = 0;
my $forcelinkdelays = 0;

214
215
216
217
# And the per-lan control, based on the above two variables, and
# per-lan variable in the virt_lans table. Indexed by lan name.
my %uselinkdelay    = ();

218
219
220
221
my $query_result =
    DBQueryFatal("SELECT uselinkdelays,forcelinkdelays from experiments ".
		 "where pid='$pid' and eid='$eid'");
($uselinkdelays,$forcelinkdelays) = $query_result->fetchrow_array();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
222

223
224
225
# Figure out what kind of links we have. Indexed by bandwidth and is
# just a set.
my %okbandwidths = ();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
226

227
228
$query_result =
    DBQueryFatal("SELECT type,max_speed from interface_types");
229

230
while (($type,$bandwidth) = $query_result->fetchrow_array()) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
231
232
    $okbandwidths{$bandwidth} = 1;
}
233
234
235

# Load delay osids and default osids for types
my %delayosids   = ();
236
my %jailosids    = ();
237
238
239
240
241
242
my %defaultosids = ();

$query_result =
    DBQueryFatal("SELECT type,delay_osid,osid from node_types");

while (($type,$delayosid,$defosid) = $query_result->fetchrow_array()) {
243
244
    $delayosids{$type}   = $delayosid;
    $jailosids{$type}    = "emulab-ops-FBSD47-JAIL";
245
246
    $defaultosids{$type} = $defosid;
}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
247

Shashi Guruprasad's avatar
Shashi Guruprasad committed
248
249
250
251
# XXX NSE hack: List of simulated nodes. All these are gonna go
# into one pc850. Needs to change in distributed nse
my @simnodelist;
my %simnode_iplist = ();
252
253
my %iptonodemap    = ();
my $nsenode_id     = 0;
Shashi Guruprasad's avatar
Shashi Guruprasad committed
254

Leigh B. Stoller's avatar
Leigh B. Stoller committed
255
256
257
# XXX Remote/Virt node hacks. Turns out to be similar to NSE.
my %isremotenode = ();
my %isvirtnode   = ();
258
259
my $remotecount  = 0;
my $virtcount    = 0;
260
my $virtnode_id  = 0;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
261

Chad Barb's avatar
   
Chad Barb committed
262
263
my %alreadyAllocated = ();

Chad Barb's avatar
   
Chad Barb committed
264
265
266
267
268
269
270
271
if ($updating) {
    printdb "Fixing previously allocated nodes.\n";
	$result = 
	    DBQueryFatal("SELECT vname, node_id ".
			 "FROM reserved ".
			 "WHERE pid='$pid' AND eid='$eid'");
    
    while (($vname,$reserved) = $result->fetchrow_array) {
Chad Barb's avatar
   
Chad Barb committed
272
273
274
	$reserved_nodes{$vname} = $reserved;
	$fixed_nodes{$vname}    = $reserved;    
	$alreadyAllocated{$reserved} = "unused";
Chad Barb's avatar
   
Chad Barb committed
275
276
277
278
279
    }
    $result->finish;
}


Leigh B. Stoller's avatar
Leigh B. Stoller committed
280
printdb "Loading virt_nodes.\n";
281
$result =
Chad Barb's avatar
   
Chad Barb committed
282
    DBQueryFatal("select distinct vn.vname,vn.ips,vn.type,vn.fixed, ".
Chad Barb's avatar
   
Chad Barb committed
283
		 " nt.isremotenode,nt.isvirtnode ".
284
285
286
		 " from virt_nodes as vn ".
		 "left join node_types as nt on ".
		 " nt.type=vn.type or nt.class=vn.type ".
Chad Barb's avatar
   
Chad Barb committed
287
288
		 "where vn.pid='$pid' and vn.eid='$eid' ".
		 "order by vn.vname");
Chad Barb's avatar
   
Chad Barb committed
289

Chad Barb's avatar
   
Chad Barb committed
290
while (($vname,$ips,$type,$fixed,$isremote,$isvirt) = 
Chad Barb's avatar
   
Chad Barb committed
291
        $result->fetchrow_array){
Leigh B. Stoller's avatar
Leigh B. Stoller committed
292
293
294
295
    if (defined($fixed) && $fixed eq "") {
	undef($fixed);
    }
    
296
    # REMOTENODE HACK
297
    #
298
    # if its a vtype, no entry in node_types. vtypes break remote nodes.
299
300
301
    # Need to look inside the vtype and make sure no mixing of vnodes and
    # physnodes. Later ...
    #
302
    if (! defined($isremote)) {$isremote = 0;}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
303
304
305
306
    if (! defined($isvirt)) {$isvirt = 0;}
    
    printdb "  $vname $type $ips";
    printdb " " . (defined($fixed) ? $fixed : "") . " $isremote\n";
307
    
Leigh B. Stoller's avatar
Leigh B. Stoller committed
308
309
310
311
312
313
314
315
316
317
    # We need to check the names to make sure they won't clash with
    # our internal delay node names.
    if (($vname =~ /^tbdelay\d+/) ||
	($vname =~ /^tbsdelay\d+/)) {
	print STDERR "Warning: $vname is a reserved name.  Working around.\n";
	($num) = ($vname =~ /(\d+)/);
	#
	# Only ever move delayid forward. Rows arrive ordered by vname as
	# strings, so a later row can carry a smaller number than an
	# earlier one (tbdelay10 sorts before tbdelay9, tbdelay5 before
	# tbsdelay2). Setting delayid back down would let a generated
	# delay node name collide with the earlier user-supplied name.
	#
	if ($num + 1 > $delayid) {
	    $delayid = $num + 1;
	}
    }
    $nodes{$vname} = $type;
    $nodelans{$vname} = [];
318

Shashi Guruprasad's avatar
Shashi Guruprasad committed
319
320
321
322
    if( $type eq "sim" ) {
      push( @simnodelist, $vname );
      $simnode_iplist{$vname} = [];
    }    
323
    # REMOTENODE HACK
324
    # 
325
    $isremotenode{$vname} = $isremote;
326
327
    $remotecount++
	if ($isremote);
328
329
330
    foreach $ipinfo (split(" ",$ips)) {
	($port,$ip) = split(":",$ipinfo);
	$ips{"$vname:$port"} = $ip;
Shashi Guruprasad's avatar
Shashi Guruprasad committed
331
332
333
334
	if( $type eq "sim" ) {
	  push(@{$simnode_iplist{$vname}}, $ip);
	}
	$iptonodemap{$ip} = $vname;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
335
    }
Leigh B. Stoller's avatar
Leigh B. Stoller committed
336
    $isvirtnode{$vname} = $isvirt;
337
338
    $virtcount++
	if ($isvirt);
Chad Barb's avatar
   
Chad Barb committed
339

Leigh B. Stoller's avatar
Leigh B. Stoller committed
340
    if (defined($fixed)) {
341
342
	$fixed_nodes{$vname} = $fixed;
    }
Leigh B. Stoller's avatar
Leigh B. Stoller committed
343
}
344
$result->finish;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
345
346

printdb "Loading virt_lans.\n";
347
348
$result =
    DBQueryFatal("select vname,member,delay,bandwidth,lossrate," .
349
350
		 "rdelay,rbandwidth,rlossrate,widearea, ".
		 "emulated,uselinkdelay " .
Chad Barb's avatar
   
Chad Barb committed
351
352
		 "from virt_lans where pid='$pid' and eid='$eid' ".
                 "order by vname,member");
353
354

#
355
# REMOTENODE HACK: Remote nodes are special.
356
#
357
# A list of all lans that have remote nodes as members,
358
my %rnodelans = ();
359
360
361
# A list of all the tunnels we need to build. Each list member is a list
# of the nodes in the tunnel.
my %tunnels   = ();
362
363

#
364
# Process the virt_lans table.
365
# 
366
367
368
369
while (my ($vname,$member,$delay,$bandwidth,$lossrate,
	   $rdelay,$rbandwidth,$rlossrate,$widearea,
	   $isemulated,$uselinkdelay) = $result->fetchrow_array) {
    my ($node,$port) = split(":",$member);
370
371

    #
372
    # REMOTENODE HACK: 
373
    #
374
    # If its a duplex link involving a remotenode, skip it. 
375
    # We do not want to have assign deal with these. The nodes are
376
377
    # allocated as unconnected by another program, and we deal with
    # it later by creating tunnels.
378
    # 
379
    if ($widearea) {
380
381
382
383
	if (! defined($tunnels{$vname})) {
	    $tunnels{$vname} = [];
	}
	push(@{$tunnels{$vname}},$member);
384
	$rnodelans{$vname} = 1;
385
386
	printdb "    Added $member to tunnels of $vname\n";
	next;
387
388
    }
    
Leigh B. Stoller's avatar
Leigh B. Stoller committed
389
390
391
392
    if (! defined($lans{$vname})) {
	$lans{$vname} = [];
    }
    push(@{$lans{$vname}},$member);
Christopher Alfeld's avatar
Christopher Alfeld committed
393
394
    $delayinfo{"$vname:$member"} = [$delay,$bandwidth,$lossrate,
				    $rdelay,$rbandwidth,$rlossrate];
395
396
397
398
399
400
401
402
403

    #
    # Grab the Q stuff from virt_lans. I'm keeping this separate for
    # now until I understand whats going on. There are no "r" params
    # either. I have no idea how to do this stuff for lans, and for
    # duplex links the "r" params are not necessary. Each virt_lans
    # entry gives the params towards the switch, which equal the
    # reverse params for the other member. 
    #
404
    $query_result =
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
	DBQueryFatal("select q_limit,q_maxthresh,q_minthresh,q_weight, ".
		     "       q_linterm,q_qinbytes,q_bytes,q_meanpsize, ".
		     "       q_wait,q_setbit,q_droptail,q_red,q_gentle ".
		     "from virt_lans ".
		     "where pid='$pid' and eid='$eid' and ".
		     "      vname='$vname' and member='$member'");
    
    my ($q_limit,$q_maxthresh,$q_minthresh,$q_weight,$q_linterm,
	$q_qinbytes,$q_bytes,$q_meanpsize,$q_wait,$q_setbit,
	$q_droptail,$q_red,$q_gentle) = $query_result->fetchrow_array;
    
    $queueinfo{"$vname:$member"} =
	[$q_limit,$q_maxthresh,$q_minthresh,$q_weight,$q_linterm,
	 $q_qinbytes,$q_bytes,$q_meanpsize,$q_wait,$q_setbit,
	 $q_droptail,$q_red,$q_gentle];

    if ($q_red) {
	$mustdelay{$vname} = 1;
    }
424
425
    $emulated{$vname} = $isemulated;
    $uselinkdelay{$vname} = $uselinkdelay;
426
    
427
428
429
430
431
432
433
434
435
436
437
438
    #
    # XXX - Whenever a delay node is inserted, port speeds are set to
    #       100Mbs, even if they requested exactly 10Mbs. This is a
    #       simplification. At some point we might want to force all the
    #       ports along the way to 10Mbs, and have the delay node worry
    #       about delay only, and not bandwidth. That will be harder to
    #       do in this mess. See companion XXX below where the delays
    #       table is initialized. Initially, we set the speed to 10Mbs,
    #       if a delay node is inserted below, it resets this to 100Mbs.
    # 
    if ($bandwidth == $S10Kbs && $delaywithswitch) {
	$portbw{$member} = $S10Mbs;
439
    } else {
440
	$portbw{$member} = $S100Mbs;
441
    }
Leigh B. Stoller's avatar
Leigh B. Stoller committed
442
    push(@{$nodelans{$node}},"$port:$vname");
443
    printdb "  portbw of $member = $portbw{$member}\n";
Christopher Alfeld's avatar
Christopher Alfeld committed
444
    printdb "  $vname $member - $delay $bandwidth $lossrate $rdelay $rbandwidth $rlossrate\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
445
446
    printdb "    Added $port:$vname to nodelans of $node\n";
}
447
$result->finish;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
448

449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
#
# Check event list. Anytime we find an event to control a link, we need
# to drop a delay node in. start/stop especially, since thats the easiest
# way to do that, even if the link has no other traffic shaping in it. 
# 
printdb "Checking events for LINK commands.\n";
$result =
    DBQueryFatal("select distinct vname from eventlist as ex ".
		 "left join event_eventtypes as et on ex.eventtype=et.idx ".
		 "left join event_objecttypes as ot on ex.objecttype=ot.idx ".
		 "where ot.type='LINK' and ex.pid='$pid' and ex.eid='$eid'");
while (($vname) = $result->fetchrow_array) {
    $mustdelay{$vname} = 1;
}

Leigh B. Stoller's avatar
Leigh B. Stoller committed
464
465
466
467
468
469
470
# Shark hack
foreach $lan (keys(%lans)) {
    $realmembers = [];
    $sharks = [];
    $hassharks = 0;
    foreach $member (@{$lans{$lan}}) {
	($node) = (split(":",$member))[0];
471
	if (($nodes{$node} eq "shark") || ($nodes{$node} eq "dnard")) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
472
473
474
475
476
477
478
479
480
481
482
483
	    push(@$sharks,$member);
	    $hassharks = 1;
	} else {
	    push(@$realmembers,$member);
	}
    }
    if ($hassharks) {
	$shelfid = "sharkshelf$sharkshelfid";
	printdb "  Creating shark shelf: $shelfid (" . 
	    join(" ",@$sharks) . ")\n";
	$sharkshelfid++;
	$sharkshelves{$shelfid} = $sharks;
484
	$delayinfo{"$lan:$shelfid:uplink"} = [0,$S100Kbs,0.0,
485
					      0,$S100Kbs,0.0];
Leigh B. Stoller's avatar
Leigh B. Stoller committed
486
487
488
489
490
491
492
	push(@$realmembers,"$shelfid:uplink");
	$nodes{$shelfid} = "shark-shelf";
    }
    $lans{$lan} = $realmembers;
}
# End shark hack

Christopher Alfeld's avatar
Christopher Alfeld committed
493
494
495
496
497
498
499
500
501
# Load virt types
printdb "Loading virt_vtypes.\n";
$result = DBQueryFatal("SELECT name,weight,members from virt_vtypes" .
		       " where pid=\"$pid\" and eid=\"$eid\"");
while (($name,$weight,$types) = $result->fetchrow_array) {
    printdb "  $name $weight $types\n";
    $vtypes{$name} = "$weight $types";
}

Leigh B. Stoller's avatar
Leigh B. Stoller committed
502
# Open the TOP file
503
$topfile = "$eid.top";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
504
# The bareword handle TOPFILE is kept because the rest of the script
# prints to it by name. The three-argument form keeps $topfile from being
# parsed for mode characters, and $! is reported so a failure can be
# diagnosed.
open(TOPFILE, ">", $topfile) || do {
    die("*** $0:\n".
	"    Could not open $topfile: $!\n");
};

Christopher Alfeld's avatar
Christopher Alfeld committed
509
510
511
512
# Print out vtypes
foreach $vtype (keys(%vtypes)) {
    print TOPFILE "make-vclass $vtype $vtypes{$vtype}\n";
}
513
514
515

$nodes=0;

Leigh B. Stoller's avatar
Leigh B. Stoller committed
516
517
foreach $node (keys(%nodes)) {
    # Shark hack
518
    if (($nodes{$node} ne "shark") &&
519
	($nodes{$node} ne "dnard") && !$isremotenode{$node}) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
520
	print TOPFILE "node $node $nodes{$node}\n";
521
522
523
	if ($nodes{$node} ne "shark-shelf") {
	    $nodes++;
	}
Leigh B. Stoller's avatar
Leigh B. Stoller committed
524
525
526
527
    }
    # End Shark hack
}

Shashi Guruprasad's avatar
Shashi Guruprasad committed
528
529
530
531
#
# lans that have simulated nodes
my %simnodelans = ();

Leigh B. Stoller's avatar
Leigh B. Stoller committed
532
533
foreach $lan (keys(%lans)) {
    @members = @{$lans{$lan}};
534
    printdb "$lan - " . join(" ",@members) . "\n";
535
536
537
    # Shark hack for rvr
    $sharks = 0;
    $nonsharks = 0;
Shashi Guruprasad's avatar
Shashi Guruprasad committed
538
539
    $simnodes = 0;
    $realnodes = 0;
540
541
542
    my $emulated = $emulated{$lan};
    my $uselinkdelay = $uselinkdelay{$lan};
    my $mustdelay = $mustdelay{$lan};
543
    $trivial_ok = 0;
544
545
546
547
    foreach $member (@members) {
	($node) = (split(":",$member))[0];
	if ($nodes{$node} eq "shark-shelf") {
	    $sharks++;
548
	} elsif ($nodes{$node} eq "sim") {
Shashi Guruprasad's avatar
Shashi Guruprasad committed
549
550
	    $simnodes++;
	    $simnodelans{$lan} = 1;
551
	} else {
552
	    # We always use an emulated link when its a virtnode.
553
554
	    if ($isvirtnode{$node}) {
		$emulated++;
555
		$emulated{$lan} = 1;
556
	    }
557
	    $nonsharks++;
Shashi Guruprasad's avatar
Shashi Guruprasad committed
558
	    $realnodes++;
559
560
	}
    }
561
562
563
564
565
566
567
    #
    # Hmm, no emulated lans for now. 
    #
    if ($emulated && @members > 2) {
	die("*** $0:\n".
	    "    Emulated lans ($lan) not allowed yet! Only links.\n");
    }
568
569
570
    if ($simnodes > 0 && $realnodes == 0 && $sharks == 0) {
	$trivial_ok = 1;
    }
Leigh B. Stoller's avatar
Leigh B. Stoller committed
571
572
573
574
    if ($#members == 1) {
	($nodeport0,$nodeport1) = @members;
	$node0 = (split(":",$nodeport0))[0];
	$node1 = (split(":",$nodeport1))[0];
Christopher Alfeld's avatar
Christopher Alfeld committed
575
576
577
578
579
580
581
582
583
584
585
586
587
	($delay0,$bw0,$loss0,
	 $rdelay0,$rbw0,$rloss0) = @{$delayinfo{"$lan:$nodeport0"}};
	($delay1,$bw1,$loss1,
	 $rdelay1,$rbw1,$rloss1) = @{$delayinfo{"$lan:$nodeport1"}};
	# Here the r's are going to be 1->0 and the others 0->1
	$delay = $delay0+$rdelay1;
	$loss = 1-(1-$loss0)*(1-$rloss1);
	$bw = &min($bw0,$rbw1);
	$rdelay = $rdelay0+$delay1;
	$rloss = 1-(1-$rloss0)*(1-$loss1);
	$rbw = &min($rbw0,$bw1);
	$bandwidth = &getbandwidth(&min($bw0,$rbw1));
	$rbandwidth = &getbandwidth(&min($rbw0,$bw1));
Shashi Guruprasad's avatar
Shashi Guruprasad committed
588
	if (((($delay >= $delaythresh) ||
589
590
591
592
593
594
595
596
597
598
599
600
601
	      (($bw != $S100Kbs) && ($bw != $S10Kbs)) ||
	      (($delaywithswitch == 0) && 
	       (($bw != $S100Kbs) && (($sharks == 0) || ($nonsharks > 1)))) || 
	      ($loss != 0)) ||
	     (($rdelay >= $delaythresh) ||
	      (($rbw != $S100Kbs) && ($rbw != $S10Kbs)) ||
	      (($delaywithswitch == 0) && 
	       (($rbw != $S100Kbs) && (($sharks == 0) || ($nonsharks > 1))))|| 
	      ($rloss != 0)) ||
	     # Link must be shaped for other reasons (q_red).
	     $mustdelay ||
	     # Global force, or per-link force. 
	     $forcelinkdelays || $uselinkdelay) &&
602
603
604
605
	    # XXX simulated nodes hack. We don't want to put delay nodes
	    # between simulated nodes. If there is a link between a
	    # simulated and a real node, we might need to put in delay
	    # nodes
606
607
608
609
610
611
612
613
614
	    ($realnodes != 0)) {
	    #
	    # We use a linkdelay if the link is emulated, globally forced,
	    # globally preferred if the link is shaped, or if the per-link
	    # flag was set (which means to put in a link delay regardless
	    # of whether the link is shaped).
	    #
	    if ($emulated ||
		$forcelinkdelays || $uselinkdelays || $uselinkdelay) {
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
		my $plink = "linksimple/$lan/$nodeport0,$nodeport1";
		
		$delaylinks{$plink} = [$nodeport0,$delay,$bw,$loss,
				       $nodeport1,$rdelay,$rbw,$rloss];
	    
		print(TOPFILE "link $plink $node0 $node1 ".
		      max($bw,$rbw) . " 0 0" .
		      ($emulated ? " emulated\n" : "\n"));

		printdb "Delay link $plink = " . 
		    join(" ",@{$delaylinks{$plink}}) . "\n";
	    }
	    else {
		my $delayname = "tbsdelay" . $delayid++;
		my $plink     = "linksdelaysrc/$lan/$nodeport0,$nodeport1";
		
		$delaylinks{$plink} = [$nodeport0,$delay,$bw,$loss,
				       $nodeport1,$rdelay,$rbw,$rloss];

		print TOPFILE "node $delayname delay\n";
		print TOPFILE "link linksdelaysrc/$lan/$nodeport0,$nodeport1 ".
		    "$node0 $delayname $bandwidth 0 0\n";
		print TOPFILE "link linksdelaydst/$lan/$nodeport1,$nodeport0 ".
		    "$node1 $delayname $bandwidth 0 0\n";

		$delaynodes{$delayname} = $delayname;
		
		printdb "Delay node $plink ($delayname) = " . 
		    join(" ",@{$delaylinks{$plink}}) . "\n";
	    }
645
646
647
648
649
650
651
652
	    #
	    # Ports are set to 100Mbs when a link gets a delay node.
	    # This can override initialization above cause we could not
	    # tell earlier if the link was going to get a real delay node
	    # or just a delaywithswitch.
	    #
	    $portbw{$nodeport0} = $S100Mbs;	    
	    $portbw{$nodeport1} = $S100Mbs;	    
Leigh B. Stoller's avatar
Leigh B. Stoller committed
653
	} else {
654
655
656
657
658
	    print TOPFILE "link linksimple/$lan/$nodeport0,$nodeport1 ".
		"$node0 $node1 $bandwidth 0 0";
	    if ($emulated) {
		print TOPFILE " emulated";
	    }
659
660
661
	    if ($trivial_ok) {
		print TOPFILE " trivial_ok";
	    }
662
	    print TOPFILE "\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
663
	}
664
    } elsif ($#members != 0) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
665
666
667
	print TOPFILE "node lan/$lan lan\n";
	$lannodes{"lan/$lan"} = 1;
	foreach $member (@members) {
Christopher Alfeld's avatar
Christopher Alfeld committed
668
669
	    ($delay,$bw,$loss,
	     $rdelay,$rbw,$rloss) = @{$delayinfo{"$lan:$member"}};
Leigh B. Stoller's avatar
Leigh B. Stoller committed
670
	    $bandwidth = &getbandwidth($bw);
Christopher Alfeld's avatar
Christopher Alfeld committed
671
	    $rbandwidth = &getbandwidth($rbw);
Leigh B. Stoller's avatar
Leigh B. Stoller committed
672
	    ($node) = (split(":",$member))[0];
673
674
# XXX The expression below should be modified for better bandwidth support.
# Probably needs to happen post assign somehow.
Shashi Guruprasad's avatar
Shashi Guruprasad committed
675
	    if (((($delay >= $delaythresh) ||
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
		  (($bw != $S100Kbs) && ($bw != $S10Kbs))  ||
		  (($delaywithswitch == 0) && 
		   (($bw != $S100Kbs) && (($sharks == 0) ||
					  ($nonsharks > 1)))) ||
		  ($loss != 0)) || 
		 (($rdelay >= $delaythresh) ||
		  (($rbw != $S100Kbs) && ($rbw != $S10Kbs))  ||
		  (($delaywithswitch == 0) && 
		   (($rbw != $S100Kbs) && (($sharks == 0) ||
					   ($nonsharks > 1)))) ||
		  ($rloss != 0)) ||
		 # Link must be shaped for other reasons (q_red).
		 $mustdelay ||
		 # Global force, or per-lan force. 
		 $forcelinkdelays || $uselinkdelay) &&
691
692
		# if we have 1 real node in the LAN, we may need to create
		# a lan
693
694
695
696
697
698
699
700
701
702
703
		($realnodes != 0)) {
		#
		# We use a linkdelay if the link is emulated, globally forced,
		# globally preferred if the link is shaped, or if the per-link
		# flag was set (which means to put in a link delay regardless
		# of whether the link is shaped).
		#
		# NB: Emulated lans not supported at this time. Caught above.
		#
		if ($emulated ||
		    $forcelinkdelays || $uselinkdelays || $uselinkdelay) {
704
705
706
707
708
709
710
		    my $plink = "linklan/$lan/$member";
		    
		    $delaylinks{$plink} =
			[$member,$delay,$bw,$loss,
			 $member,$rdelay,$rbw,$rloss];

		    print(TOPFILE "link $plink $node lan/$lan " .
711
			  max($bw,$rbw) . " 0 0" .
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
			  ($emulated ? " emulated\n" : "\n"));

		    printdb "Delay link $plink = " .
			    join(" ", @{$delaylinks{$plink}}) . "\n";
		}
		else {
		    my $delayname = "tbdelay" . $delayid++;
		    my $plink     = "linkdelaysrc/$lan/$member";

		    $delaylinks{$plink} =
			[$member,$delay,$bw,$loss,
			 $member,$rdelay,$rbw,$rloss];
		    
		    print TOPFILE "node $delayname delay\n";
		    print TOPFILE "link linkdelaysrc/$lan/$member" .
			" $node $delayname $bandwidth 0 0\n";
		    print TOPFILE "link linkdelaydst/$lan/$member" .
			" lan/$lan $delayname $bandwidth 0 0\n";
		    
		    $delaynodes{$delayname} = $delayname;

		    printdb "Delay node $plink ($delayname) = " .
			    join(" ", @{$delaylinks{$plink}}) . "\n";
		}
736
737
738
739
740
741
742
		#
		# Port is set to 100Mbs when the link gets a delay node.
		# This can override initialization above cause we could not
		# tell earlier if the link was going to get a real delay node
		# or just a delaywithswitch.
		#
		$portbw{$member} = $S100Mbs;	    
Leigh B. Stoller's avatar
Leigh B. Stoller committed
743
744
	    } else {
		print TOPFILE "link linklan/$lan/$member $node lan/$lan" .
745
746
747
748
		    " $bandwidth 0 0";
		if ($emulated) {
		    print TOPFILE " emulated";
		}
749
750
751
		if ($trivial_ok) {
		    print TOPFILE " trivial_ok";
		}
752
		print TOPFILE "\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
753
754
755
	    }
	}
    }
756
    # If a LAN has only one member we don't do anything.
Leigh B. Stoller's avatar
Leigh B. Stoller committed
757
758
}

Shashi Guruprasad's avatar
Shashi Guruprasad committed
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
# XXX NSE hack
# Will find a free randomly chosen pc850 and fix sim nodes to it
# Assign's scoring needs to be fixed so that the solution has
# as many sim nodes on a phy node as possible while maxing out
# its interfaces. Currently having sim:N where N is a large
# number in the ptop file does not guarantee that all these
# get mapped to a single phy node even when that mapping has no
# violations and a low score. distributed nse will fix this
#$result =
#  DBQueryFatal("select a.node_id,a.type from nodes as a ".
#	   "left join reserved as b on a.node_id=b.node_id ".
#	   "left join reserved as m on a.phys_nodeid=m.node_id ".
#	   "where b.node_id is null and (a.role='testnode' and ".
#	   "      a.type='pc850' and ".
#	   "       (m.node_id is null or ".
#	   "        m.pid!='$DEADPID' or m.eid!='$DEADEID'))");
if( scalar(@simnodelist) > 0 ) {
  open(AVAIL,"$TBROOT/sbin/avail type=pc rand |")
    or die "*** $0:\n".
           "    avail failed\n";

  # Pick the first node that avail reports.  Data rows start with '|';
  # the header row is recognized by its "node_id" column title.
  # $num ends up 1 if a node was found and 0 otherwise.
  my $num = 0;
  while (<AVAIL>) {
    next if (! /^\|/);
    next if (/node_id/);
    # Only accept a row whose columns actually parse.  Previously the row
    # was counted even when the match failed, which left $fixednode
    # undefined while still reporting that a node had been found.
    if (/^\|([-a-zA-Z0-9]+)\s*\|(\w+)\s*\|(\w+)\s*\|$/) {
      ($fixednode,$type) = ($1,$2);
      $num++;
      last;
    }
  }
  close(AVAIL);
  
  if( $num == 0 ) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
791
    print STDERR "$0: *** Insufficient PCs available.\n";
Shashi Guruprasad's avatar
Shashi Guruprasad committed
792
793
794
795
796
797
798
799
    exit(2);
  }

  foreach $simnode (@simnodelist) {
    print TOPFILE "fix-node $simnode $fixednode\n";
  }
}

800
# Print out fixed nodes
Chad Barb's avatar
   
Chad Barb committed
801
802
803
804
# But _not_ nodes which aren't in the experiment any more.
# CRB you can only fix nodes and delaynodes, right?
$reused_count = 0;

805
foreach $fixed (keys(%fixed_nodes)) {
Chad Barb's avatar
   
Chad Barb committed
806
807
    if (!$isremotenode{$fixed} && 
	(exists $nodes{$fixed} || exists $delaynodes{$fixed}) ) {
808
	print TOPFILE "fix-node $fixed $fixed_nodes{$fixed}\n";
Chad Barb's avatar
   
Chad Barb committed
809
	if ($reserved_nodes{$fixed}) { $reused_count++; }
810
    }
811
812
}

Leigh B. Stoller's avatar
Leigh B. Stoller committed
813
814
close TOPFILE;

815
# Set estimations
Chad Barb's avatar
   
Chad Barb committed
816
817
$minimum_nodes = $nodes + keys(%delaynodes)/$DELAYCAPACITY - $reused_count;
$maximum_nodes = $nodes + keys(%delaynodes) - $reused_count;
818
DBQueryFatal("UPDATE experiments set maximum_nodes=$maximum_nodes, " .
819
	 "minimum_nodes=$minimum_nodes where pid=\"$pid\" and eid=\"$eid\"");
820
print "Minimum nodes = $minimum_nodes\n";
821
822
print "Maximum nodes = $maximum_nodes\n";

823
824
TBDebugTimeStamp("top finished");

Leigh B. Stoller's avatar
Leigh B. Stoller committed
825
826
827
828
829
830
831
832
833
######################################################################
# Step 2 - Assign Loop
# 
# Here we loop up to maxrun times.  In each loop we snapshot the
# current testbed state into a ptop file.  We then run assign.  If
# assign succeeds we attempt to reserve the resources.  If that works
# we're done with step 2 otherwise we loop again.
#
# v2pmap is indexed by virtual and contains the physical node.
Shashi Guruprasad's avatar
Shashi Guruprasad committed
834
# p2vmap is indexed by physical and contains one or more virtual nodes
Leigh B. Stoller's avatar
Leigh B. Stoller committed
835
836
837
838
839
# plinks is indexed by virtual name and contains 
#  (pnodeportA,pnodeportB) .  If one is a delay node it is always
#  the second.
#######################################################################

840
TBDebugTimeStamp("assign_loop started");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
841
842
843
844
845
$currentrun = 1;
while (1) {
    print "Assign Run $currentrun\n";

    # Violation counts
846
    $unassigned = -1;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
847
848
849
850
851
852
853
854
    $linkusers = -1;
    $bandwidth = -1;
    $desires = -1;

    # Clear v2pmap, p2vmap, and plinks
    undef %v2pmap;
    undef %p2vmap;
    undef %plinks;
855
856
    undef %toreserve;
    undef %virtnodes;
Shashi Guruprasad's avatar
Shashi Guruprasad committed
857
    
858
    TBDebugTimeStamp("ptopgen started");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
859
    # Snapshot
Chad Barb's avatar
   
Chad Barb committed
860
861
862
863
864
865
866
867
868
869
    #
    # if updating (-u), include any resources that may already be
    # allocated to experiment in the PTOP results.
    #
    if ($updating) {
	system("ptopgen -e $pid/$eid > $ptopfile");
    } else {
	system("ptopgen > $ptopfile");
    }

870
    TBDebugTimeStamp("ptopgen finished");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
871
872

    # Get number of nodes
873
874
    my $numnodes_result = 
	DBQueryFatal("select a.node_id,a.type from" .
Leigh B. Stoller's avatar
Leigh B. Stoller committed
875
876
877
		     " nodes as a left join reserved as b" .
		     " on a.node_id=b.node_id" .
		     " where b.node_id is null" .
878
		     " and a.role='testnode' and a.type!='dnard'");
879
    $numnodes = $numnodes_result->numrows;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
880
881
    
    if ($numnodes < $minimum_nodes) {
882
	print STDERR "$0: *** Insufficient nodes available.\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
883
884
885
	exit(2);
    }

886
    TBDebugTimeStamp("assign started");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
887
888
    # Run assign
    $fail = 0;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
889
    my $cmdargs = "$ptopfile $topfile";
890
    $cmdargs = "-p $cmdargs"
891
	if ($virtcount);
892
893
    print "assign $cmdargs\n";
    # Run assign with its output teed to assign.log and read back here.
    # Check the open: an unopened handle reads as immediate EOF, which the
    # code below would treat as an ordinary assign failure and retry.
    open(ASSIGNFP,"assign $cmdargs | tee assign.log |") or
	die("*** $0:\n".
	    "    Failed to start assign: $!\n");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
894
895
896
897
898
899
900
901
    $violations = 0;
    $score = -1;

    # read output
    # Header
    printdb "Reading assign results.\n";
    while (<ASSIGNFP>) {
	chop;
902
903
904
905
	/No physical nodes of type (.+)$/ && do {
	    $score=-2;
	    print $_ . "\n";
	};
Leigh B. Stoller's avatar
Leigh B. Stoller committed
906
907
908
909
	/^With ([0-9]+) violations$/ && do {
	    $violations = $1;
	    last;
	};
910
 	/^[ \t]+BEST SCORE: [ \t]+([0-9]+(\.[0-9]+)?)/ && ($score=$1);
Leigh B. Stoller's avatar
Leigh B. Stoller committed
911
    }
912
913
914
915
916
    if ($score == -2) {
	# Type error
	print "Giving up.\n";
	exit(2);
    }
Leigh B. Stoller's avatar
Leigh B. Stoller committed
917
918
919
920
921
922
923
924
925
926
927
    printdb "Found score $score, violations $violations.\n";

    # We don't bother reading anything else if violations occurred.
    if (($violations == 0) && ($score != -1)) {
	# read nodes section
	# Skip ahead to the "Nodes:" header.  The read must also stop at EOF:
	# readline returns undef there, and undef never matches /^Nodes:/, so
	# an unguarded "!~" test would spin forever on truncated output.
	while (defined(my $skipped = <ASSIGNFP>)) {
	    last
		if ($skipped =~ /^Nodes:/);
	}
	printdb "Nodes:\n";
	while (<ASSIGNFP>) {
	    chop;
	    /^End Nodes$/ && last;
	    @info = split;
928
929
930
931
932
933
	    ($virtual,$physical) = @info[0,1];

	    # We don't care about LAN nodes anymore.
	    if (defined($lannodes{$virtual})) {
		next;
	    }
Chad Barb's avatar
   
Chad Barb committed
934

Chad Barb's avatar
   
Chad Barb committed
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
	    if ($alreadyAllocated{$physical}) {
		#
		# Mark node as being reused.
		#
		# Look at virtual node being mapped to node;
		# if it wasn't in the previous map, mark node for reboot.
		# 
		if (! exists $reserved_nodes{$virtual} ||
		    $reserved_nodes{$virtual} ne $physical ||
		    $alreadyAllocated{$physical} eq "reboot") {
		    $alreadyAllocated{$physical} = "reboot";
		} else {
		    $alreadyAllocated{$physical} = "reused";
		}
	    } else {
		#
		# This is a new node; we'll have to reserve it.
		#
Chad Barb's avatar
   
Chad Barb committed
953
954
		$toreserve{$physical} = 1;	    
	    }
955
956
957
958
959
960
961
962
963
964
965
	    
	    if ($isvirtnode{$virtual}) {
		#
		# If mapping a virtual node, then record that, since we need
		# to allocate the virtnodes on that physnode, later.
		#
		if (!defined($virtnodes{$physical})) {
		    $virtnodes{$physical} = [];
		}
		push(@{$virtnodes{$physical}}, $virtual);
	    }
Leigh B. Stoller's avatar
Leigh B. Stoller committed
966
	    $v2pmap{$virtual} = $physical;
Shashi Guruprasad's avatar
Shashi Guruprasad committed
967
	    if( ! defined($p2vmap{$physical}) ) {
968
		$p2vmap{$physical} = [];
Shashi Guruprasad's avatar
Shashi Guruprasad committed
969
970
	    }
	    push(@{$p2vmap{$physical}}, $virtual);
Leigh B. Stoller's avatar
Leigh B. Stoller committed
971
972
973
974
975
976
977
978
	    printdb "  $virtual $physical\n";
	}

	# read Edges
	# By convention, in plinks, the delay node is always the second
	# entry.
	# Skip ahead to the "Edges:" header.  The read must also stop at EOF:
	# readline returns undef there, and undef never matches /^Edges:/, so
	# an unguarded "!~" test would spin forever on truncated output.
	while (defined(my $skipped = <ASSIGNFP>)) {
	    last
		if ($skipped =~ /^Edges:/);
	}
	printdb "Edges:\n";
Shashi Guruprasad's avatar
Shashi Guruprasad committed
979
980
	EDGEWHILE: while (<ASSIGNFP>) {
	    /^End Edges$/ && last EDGEWHILE;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
981
982
983
984
985
986
987
988
989
	    @info = split;
	    $line = $_;
	    $_ = $info[1]; # type
	  SWITCH1: {
	      /^intraswitch$/ && do {
		  ($vlink,$rawA,$rawB) = @info[0,3,5];
		  last SWITCH1;
	      };
	      /^interswitch$/ && do {
990
991
		  ($vlink,$rawA,$rawB) = @info[0,3,$#info];
		  last SWITCH1;
Leigh B. Stoller's avatar
Leigh B. Stoller committed
992
993
	      };
	      /^direct$/ && do {
994
995
		  die("*** $0:\n".
		      "    Unsupported link type: direct.\n");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
996
	      };
Shashi Guruprasad's avatar
Shashi Guruprasad committed
997
998
999
1000
1001
1002
	      /^trivial$/ && do {
		  # we don't have plinks for trivial links
		  $vlink = $info[0];
		  $plinks{$vlink} = [];
		  next EDGEWHILE;
	      };
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1003
1004
	      print "Found garbage: $line\n";
	  }
1005
1006
1007
1008
	    $nodeportA = &getnodeport($rawA);
	    $nodeportB = &getnodeport($rawB);
	    $nodeportA =~ s/\//:/;
	    $nodeportB =~ s/\//:/;
1009
	    $plinks{$vlink} = [$nodeportA,$nodeportB];
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1010
1011
1012
1013
1014
1015
	    printdb "  $vlink " . join(" ",@{$plinks{$vlink}}) . "\n";
	}
    } else {
	# spit out up to nodes
	print "ASSIGN FAILED:\n";       
	while (<ASSIGNFP>) {
1016
	    if (/link_users:\s*(\d+)$/) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1017
		$linkusers = $1;
1018
	    } elsif (/bandwidth:\s*(\d+)$/) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1019
		$bandwidth = $1;
1020
	    } elsif (/unassigned:\s*(\d+)$/) {
1021
		$unassigned = $1;
1022
	    } elsif (/desires:\s*(\d+)$/) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1023
1024
1025
1026
1027
1028
1029
1030
1031
		$desires = $1;
	    }
	    if (/^Nodes:/) {last;}
	    print "$_";
	}
	$fail = 1;
    }
    while (<ASSIGNFP>) { } # Read anything left in the pipe before closing
    close(ASSIGNFP);
1032
    TBDebugTimeStamp("assign finished");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1033

1034
    TBDebugTimeStamp("reserving started");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1035
    # Reserve resources
1036
    if (!$fail) {
1037
	if (system("nalloc $pid $eid " . join(" ", keys(%toreserve)))) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1038
	    print "Failed to reserve nodes. Trying again.\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1039
	} else {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1040
	    print "Successfully reserved physical nodes\n";
Chad Barb's avatar
   
Chad Barb committed
1041
1042
1043
1044
1045
1046

	    foreach $node (keys(%toreserve)) {
		# in future, this will be a fully enforced state machine.
		TBSetNodeAllocState( $node, TBDB_ALLOCSTATE_RES_INIT_DIRTY() );
	    }

1047
	    TBDebugTimeStamp("reserving finished");
Chad Barb's avatar
   
Chad Barb committed
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070

	    #
	    # Walk the nodes recorded in %alreadyAllocated and act on the
	    # state each one was left in: "unused" nodes are collected for
	    # release, "reboot" nodes are marked dirty, anything else is
	    # left alone.
	    #
	    my %tolose = ();
	    foreach $node (keys(%alreadyAllocated)) {
		if ($alreadyAllocated{$node} eq "unused") {
		    #
		    # Node was used in previous incarnation, but not any more.
		    #
		    $tolose{$node} = 1;
		} elsif ($alreadyAllocated{$node} eq "reboot") {
		    #
		    # Node is being reused, but for a different purpose, so
		    # it should be rebooted.
		    #
		    TBSetNodeAllocState( $node, TBDB_ALLOCSTATE_RES_INIT_DIRTY() );
		}
	    }
	    
	    #
	    # Hand back everything that is no longer needed in one nfree call.
	    # A failure here is reported but does not abort the run.
	    #
	    if ((keys %tolose) > 0) {
		if (system("nfree $pid $eid " . join(" ", keys(%tolose)))) {
		    # Terminate the line so later output does not run into it.
		    print "Failed to free no-longer-needed nodes!\n";
		}
	    }

Leigh B. Stoller's avatar
Leigh B. Stoller committed
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
	    last;
	}
    }

    # Check for exit
    #
    # Once the run limit is reached, build an exit code that tells the
    # caller which kinds of violations were seen.  The counters tested here
    # are reset to -1 at the top of every run and are only filled in from
    # assign's output when a run fails, so "> 0" means the run reported at
    # least one violation of that kind.
    #
    if ($currentrun >= $maxrun) {
	# Base value; each violation class below adds its own flag value.
	$exitcode = 1;
	# +4: bandwidth violations
	if ($bandwidth > 0) {
	    $exitcode += 4;
	} 
	# +8: link_users violations
	if ($linkusers > 0) {
	    $exitcode += 8;
	}
	# +16: desires violations
	if ($desires > 0) {
	    $exitcode += 16;
	}
1087
1088
1089
	if ($unassigned > 0) {
	    $exitcode += 32;
	}
1090
1091
	print "*** $0:\n".
	      "    Reached run limit. Giving up. Exitcode: $exitcode.\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1092
1093
1094
1095
1096
	exit($exitcode);
    }
    $currentrun++;
}

1097
1098
TBDebugTimeStamp("assign_loop finished");

1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
###########################################################################
# Step 2A
#
# We run the wanassigner to allocate remote nodes. We do this afterwards
# because it takes so long. We run it just once.
#
# wanassign does its own nalloc.
#
###########################################################################

1109
1110
1111
1112
1113
1114
1115
1116
#
# VIRTNODES HACK: physical nodes (from the nodes table) might really
# be a virtual node :-) Must record the underlying phys_nodeid and an
# indicator for jail.
#
my %jailed = ();

# Now allocate the remote nodes. 
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
if (scalar(keys(%isremotenode))) {
    my $success  = 0;
    my $doremote = 0;
    
    foreach my $value (values(%isremotenode)) {
	if ($value) {
	    $doremote = 1;
	}
    }
    
    if ($doremote) {
	print "Running 'wanassign -d $pid $eid'\n";
	open(WANFP,"wanassign -d $pid $eid 2>&1 | tee wanassign.log |") or
	    die("*** $0:\n".
		"    Failed to start wanassign: $!\n");

	printdb "Reading wanassign results.\n";
	while (<WANFP>) {
	    chop;
	    if ($_ =~ /(\S+) mapsto (\S+)/) {
1137
		$v2vmap{$1} = $2;
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
		printdb "  $1 $2\n";
	    }
	    if ($_ =~ /^Success/) {
		$success = 1;
	    }
	    # Skip other output. Usually its debugging output.
	}
	# Closing the pipe reports failure for either a non-zero exit status
	# or an error on the close itself.  The ?: must be parenthesized:
	# "." binds tighter than "?:", so without the parentheses the whole
	# concatenated prefix becomes the (always true) condition and the
	# "*** $0 / wanassign:" prefix is dropped from the message.
	close(WANFP) or
	    die("*** $0:\n".
		"    wanassign: " . ($? ? "exited with status: $?.\n" :
		                          "error closing pipe: $!\n"));

	if (!$success) {
	    die("*** $0:\n".
		"    wanassign could not find a solution!\n");
	}
1154
1155
1156
	foreach my $virtual (keys(%v2vmap)) {
	    my $physical = $v2vmap{$virtual};
	    my $jailflag;
1157
	    my $phys_nodeid;
1158
1159

	    TBIsNodeVirtual($physical, \$jailflag);
1160
1161
1162
1163
1164
1165
1166
1167
	    TBPhysNodeID($physical, \$phys_nodeid);
	    
	    $v2pmap{$virtual} = $phys_nodeid;
	    if ( !defined($p2vmap{$phys_nodeid})) {
		$p2vmap{$phys_nodeid} = [];
	    }
	    push(@{$p2vmap{$phys_nodeid}}, $virtual);

1168
1169
	    $jailed{$virtual}  = $jailflag;
	}
1170
1171
1172
1173
	TBDebugTimeStamp("wanassign finished");
    }
}

Leigh B. Stoller's avatar
Leigh B. Stoller committed
1174
#
1175
1176
1177
1178
# VIRTNODES HACK: Local virtnodes have to be mapped now. This is a little
# hokey in that the virtnodes just need to be allocated from the pool that
# is on the real node. We know they are free, but we should go through
# nalloc anyway.
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1179
#
1180
1181
1182
foreach my $pnode (keys(%virtnodes)) {
    my @vlist = @{$virtnodes{$pnode}};
    my @plist = ();
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1183
1184

    #
1185
1186
1187
1188
1189
1190
    # Run avail to get the list of virtnodes on the phys node. We already
    # know there are enough, since assign knows that.
    #
    my $num  = @vlist;
    
    open(AVAIL,"$TBROOT/sbin/avail virtonly=$pnode rand limit=$num |")
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1191
1192
1193
1194
1195
1196
1197
1198
1199
	or die("*** $0:\n".
	       "    avail failed\n");

    while (<AVAIL>) {
	next
	    if (! /^\|/);
	next
	    if (/node_id/);
	
1200
1201
	my ($nodeid) = /^\|([-a-zA-Z0-9]+)\s*\|(\w+)\s*\|(\w+)\s*\|$/;
	# Skip rows that do not parse instead of pushing undef.  An undef
	# entry would still satisfy the count comparison made after this
	# loop and then be handed to nalloc as an empty node name.
	next
	    if (!defined($nodeid));
	push(@plist, $nodeid);
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1202
1203
1204
    }
    close(AVAIL);

1205
    if (scalar(@vlist) != scalar(@plist)) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1206
	print STDERR "*** $0:\n".
1207
	    "Could not map some virtual nodes on $pnode\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1208
1209
1210
1211
1212
	exit(2);
    }

    #
    # Try to allocate. Note, if this fails we are done for. Okay for now
1213
    # since it is never the case that it should fail!
1214
    #
1215
1216
    print "Reserving @plist ...\n";
    if (system("nalloc $pid $eid @plist")) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1217
	die("*** $0:\n".
1218
	    "Failed to reserve @plist (on $pnode)\n");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1219
    }
1220
1221
1222
    while (@plist) {
	my $physical = pop(@plist);
	my $virtual  = pop(@vlist);
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1223

1224
1225
	$v2vmap{$virtual}  = $physical;
	printdb "  Mapping $virtual to $physical on $pnode\n";
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1226

1227
1228
	my $jailflag;
	my $phys_nodeid;
1229

1230
1231
1232
	TBIsNodeVirtual($physical, \$jailflag);
	
	$jailed{$virtual}  = $jailflag;
1233
1234
    }
}
1235

Leigh B. Stoller's avatar
Leigh B. Stoller committed
1236
TBExptSetPortRange();
1237

Leigh B. Stoller's avatar
Leigh B. Stoller committed
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
1263
######################################################################
# Step 3 - Convert to vlans, delays, and portmap
# 
# Here we convert the plinks into vlans, delays, and portmap.  We
# convert them first into internal datastructure.  After Step 4
# when we do some port swapping we'll upload the modified versions
# of these structures into the database.
#
# delays is indexed by an internal ID and contains:
#  [pnode, int0, int1, vname, delay, bandwidth, lossrate]
# portmap is indexed by <virtual node>:<virtual port> and contains
#  the physical port.
#
# vlan ids
#  vlan ids are increasing integers in the case of node<->delay connections.
#  In the case of actual LANs either of real node or of delay nodes
#  they are indexed by virtual lan name.
# delay ids
#  delay ids are increasing integers.  We could have used a list of
# delays just as well.  Having it as an array may prove useful for
# future changes however.
######################################################################

$delayid = 0;

printdb "Interpreting results.\n";
1264
TBDebugTimeStamp("interpreting started");
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1265
foreach $plink (keys(%plinks)) {
Shashi Guruprasad's avatar
Shashi Guruprasad committed
1266

1267
    # trivial links do not have physical links
Shashi Guruprasad's avatar
Shashi Guruprasad committed
1268
1269
1270
1271
    if( scalar(@{$plinks{$plink}}) == 0 ) {
      next;
    }
    
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1272
1273
1274
1275
    ($nodeportA,$nodeportB) = @{$plinks{$plink}};
    ($nodeA,$portA) = split(":",$nodeportA);
    ($nodeB,$portB) = split(":",$nodeportB);
    printdb "plink $plink - $nodeportA $nodeportB\n";
1276
    if (($lan,$virtA,$virtC) = ($plink =~ m|^linksdelaysrc/(.+)/(.+),(.+)$|)) {
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1277
1278
1279
1280
	# Node has a single entry in lan.
	# Node is nodeportA
	# Delay node is nodeportB
	# Other end of delay node will be given by plink
1281
1282
	#   linksdelaydst/lan/virtC,virtA where nodeportA will be the other 
	#   node in the virtual LAN and nodeportB will be the other end of the
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1283
	#   delay node.
1284
1285
	($nodeportC,$nodeportD) =
	    @{$plinks{"linksdelaydst/$lan/$virtC,$virtA"}};
Leigh B. Stoller's avatar
Leigh B. Stoller committed
1286
1287
1288
1289
1290
1291
1292
	($nodeC,$portC) = split(":",$nodeportC);
	($nodeD,$portD) = split(":",$nodeportD);
	printdb "LINK delay: other end = $nodeportC $nodeportD\n";

	# assert nodeB == nodeD

	printdb "  VLANS:\n";
1293
1294
	AddVlan("link", "$lan" . "-delaysrc", $nodeportA, $nodeportB);
	AddVlan("link", "$lan" . "-delaydst", $nodeportC, $nodeportD);
1295
1296