source: trunk/FACT++/scripts/takeRun.js@ 18087

Last change on this file since 18087 was 17926, checked in by tbretz, 10 years ago
Added handling for Critical and OnStandby status of feedback.
File size: 10.1 KB
Line 
1'use strict';
2
3// ================================================================
4// Code related to monitoring the fad system
5// ================================================================
6
// Bit mask of the incomplete event which triggered the last MCP/STOP.
// Zero means that no incomplete event is currently pending. It is reset
// by takeRun() before each run and evaluated after the run has stopped.
var incomplete = 0;

/**
 * Handler called whenever the service behind sub_incomplete changes.
 *
 * The first usable 'incomplete' value received while the MCP is in state
 * "TakingData" is stored in the variable 'incomplete' and the run is
 * stopped by sending MCP/STOP. All later updates are ignored as long as
 * 'incomplete' has not been reset to zero.
 *
 * @param evt
 *    the event as passed by the subscription. Only evt.data (must be
 *    non-empty) and evt.obj['incomplete'] are accessed here.
 */
sub_incomplete.onchange = function(evt)
{
    // Update without any payload
    if (!evt.data)
        return;

    var mask = evt.obj['incomplete'];

    // Ignore (in this order): an empty mask, a mask exceeding 40 bits,
    // a mask while an earlier one is still pending and everything which
    // does not happen while data is being taken.
    if (!mask || mask>0xffffffffff || incomplete>0 || dim.state("MCP").name!="TakingData")
        return;

    console.out("");
    dim.log("Incomplete event ["+mask+","+incomplete+"] detected, sending MCP/STOP");

    // Remember the mask before the run is stopped so that
    // takeRun() can evaluate it once the MCP is idle again
    incomplete = mask;
    dim.send("MCP/STOP");
}
30
31// ================================================================
32// Code related to taking data
33// ================================================================
34
/**
 * Reconnect to problematic FADs
 *
 * Disconnects and reconnects all boards in 'list' via FAD_CONTROL and
 * waits for FAD_CONTROL to reach the state "Connected" and for the MCP
 * to reach the state "Idle". If FAD_CONTROL does not get "Connected" in
 * time but is still in state "Connecting", a reset of the crates the
 * boards belong to is issued through crateReset() from
 * scripts/crateReset.js.
 *
 * @param list
 *    array with the indices of the boards to be reconnected. Not more
 *    than three boards are accepted.
 *
 * @param txt
 *    a short description of the circumstances under which the boards
 *    were lost. It is only used in the log message.
 *
 * @returns
 *    nothing. The function either returns normally or throws.
 *
 * @throws
 *    an Error if more than three boards are to be reconnected, and any
 *    exception thrown by dim.wait which is not handled by a crate reset
 *    (FAD_CONTROL not "Connected" and not "Connecting" either, or the
 *    MCP not getting "Idle").
 *
 * @example
 *    reconnect([ 5, 17 ], "data taking");
 */
function reconnect(list, txt)
{
    console.out("");
    dim.log("Trying automatic reconnect ["+txt+",n="+list.length+"]...");

    if (list.length>3)
        throw new Error("Too many boards to be reconnected. Please check what happened.");

    for (var i=0; i<list.length; i++)
    {
        console.out("   ...disconnect "+list[i]);
        dim.send("FAD_CONTROL/DISCONNECT", list[i]);
    }

    console.out("   ...waiting for 3s");
    v8.sleep(3000);

    for (var i=0; i<list.length; i++)
    {
        console.out("   ...reconnect "+list[i]);
        dim.send("FAD_CONTROL/CONNECT", list[i]);
    }

    console.out("   ...waiting for 1s");

    // Wait for one second to bridge possible pending connects
    v8.sleep(1000);

    console.out("   ...checking connection");

    // Wait for FAD_CONTROL to realize that all boards are connected
    // FIXME: Wait for '40' boards being connected instead
    try
    {
        dim.wait("FAD_CONTROL", "Connected", 3000);
    }
    catch (e)
    {
        // Only a FAD_CONTROL still trying to connect is handled
        // by a crate reset, everything else is passed on
        if (dim.state("FAD_CONTROL").name!="Connecting")
        {
            console.out("");
            console.out(" + FAD_CONTROL: "+dim.state("FAD_CONTROL").name);
            console.out("");
            throw e;
        }

        // Flag the crates the boards belong to. Ten consecutive boards
        // form one crate, so the crate index is the integer part of
        // board/10. (A plain division would yield fractional keys like
        // "1.25" which are not array entries at all.)
        var crates = [];
        for (var i=0; i<list.length; i++)
            crates[Math.floor(list[i]/10)] = true;

        include('scripts/crateReset.js');
        crateReset(crates);
    }

    // Wait also for MCP to have all boards connected again
    dim.wait("MCP", "Idle", 3000);

    dim.log("Automatic reconnect successfull.");
    console.out("");
}
127
/**
 * Take a single run
 *
 * Starts a run through MCP/START, waits for the MCP to reach the state
 * "TakingData" (with up to three attempts) and then waits for the MCP
 * to become "Idle" again. While the run is started and taken, a watchdog
 * on the state of FEEDBACK is installed which sends MCP/STOP as soon as
 * FEEDBACK changes to "Critical" or "OnStandby". The handler which was
 * installed before is called first by the watchdog and is restored in
 * any case, also if an exception is thrown.
 *
 * @param type
 *    the run type as passed to MCP/START (e.g. "data")
 *
 * @param count
 *    the number of events as passed to MCP/START. If omitted (or
 *    evaluating to false), -1 is sent.
 *
 * @param time
 *    the run time in seconds as passed to MCP/START. If omitted (or
 *    evaluating to false), -1 is sent. For time>0 the wait for the end
 *    of the run is limited to the run time plus 25%.
 *
 * @returns
 *    true if the run has ended regularly or has been stopped because
 *    FEEDBACK was found in state "Critical" or "OnStandby" right after
 *    the start. false if the run was stopped due to an incomplete event
 *    and the affected boards have been reconnected.
 *
 * @throws
 *    exceptions thrown by dim.wait or reconnect() which are not handled
 *    here, and an Error if in a run of type "data" no ext1 triggers
 *    have been received although other triggers have.
 */
function takeRun(type, count, time)
{
    if (!count)
        count = -1;
    if (!time)
        time = -1;

    var nextrun = sub_startrun.get().obj['next'];
    dim.log("Take run %3d".$(nextrun)+": N="+count+" T="+time+"s ["+type+"]");

    // FIXME: Replace by callback?
    //
    // DN: I believe instead of waiting for 'TakingData' one could split this
    // up into two checks with an extra condition:
    //  if type == 'data':
    //      wait until ThresholdCalibration starts:
    //          --> this time should be pretty identical for each run
    //      if this takes longer than say 3s:
    //          there might be a problem with one/more FADs
    //
    //      wait until "TakingData":
    //          --> this seems to take even some minutes sometimes...
    //              (might be optimized rather soon, but still in the moment...)
    //      if this takes way too long:
    //          there might be something broken,
    //          so maybe a very high time limit is ok here.
    //          I think there is not much that can go wrong,
    //          when the Thr-Calib has already started. Still it might be nice
    //          If in the future RateControl is written so to find out that
    //          in case the threshold finding algorithm does
    //          *not converge as usual*
    //          it can complain, and in this way give a hint, that the weather
    //          might be a little bit too bad.
    //  else:
    //      wait until "TakingData":
    //          --> in a non-data run this time should be pretty short again
    //      if this takes longer than say 3s:
    //          there might be a problem with one/more FADs
    //

    // Use this if you use the rate control to calibrate by rates
    //if (!dim.wait("MCP", "TakingData", -300000) )
    //{
    //    throw new Error("MCP took longer than 5 minutes to start TakingData"+
    //                    "maybe this indicates a problem with one of the FADs?");
    //}

    // ================================================================
    //  Function for Critical voltage
    // ================================================================

    // INSTALL a watchdog... send FAD_CONTROL/CLOSE_OPEN_FILES
    // could send MCP/RESET as well but would result in a timeout
    var callback = dim.onchange['FEEDBACK'];
    dim.onchange['FEEDBACK'] = function(state)
    {
        // Keep the behaviour of the handler which was installed before
        if (callback)
            callback.call(this, state);

        // React only on the transition into Critical/OnStandby,
        // not on changes between these two states
        if ((state.name=="Critical" || state.name=="OnStandby") &&
            (this.last!="Critical" && this.last!="OnStandby"))
        {
            console.out("Feedback state changed from "+this.last+" to "+state.name+" [takeRun.js]");

            // Includes FAD_CONTROL/CLOSE_ALL_OPEN_FILES
            dim.send("MCP/STOP");
        }

        this.last=state.name;
    }

    // The try/finally guarantees that the watchdog is removed again on
    // all paths (regular end, early return, exception). Otherwise a
    // failed run would leave it installed and the next call would chain
    // it as 'previous handler'.
    try
    {
        // Here we could check and handle fad losses

        incomplete = 0;

        var start = true;

        for (var n=0; n<3; n++)
        {
            if (start)
                dim.send("MCP/START", time, count, type);

            try
            {
                dim.wait("MCP", "TakingData", 15000);
                break;
            }
            catch (e)
            {
                if (dim.state("MCP").name=="TriggerOn" &&
                    dim.state("FAD_CONTROL").name=="Connected" &&
                    dim.state("FTM_CONTROL").name=="TriggerOn")
                {
                    console.out("");
                    console.out("Waiting for TakingData timed out. Everything looks ok, but file not yet open... waiting once more.");
                    // Do not send another MCP/START, just wait again
                    start = false;
                    continue;
                }

                start = true;

                console.out("");
                console.out(" + MCP:         "+dim.state("MCP").name);
                console.out(" + FAD_CONTROL: "+dim.state("FAD_CONTROL").name);
                console.out(" + FTM_CONTROL: "+dim.state("FTM_CONTROL").name);
                console.out("");

                // Only a configuration which got stuck is handled below
                if (dim.state("MCP").name!="Configuring3" ||
                    (dim.state("FAD_CONTROL").name!="Configuring1" &&
                     dim.state("FAD_CONTROL").name!="Configuring2"))
                    throw e;

                console.out("");
                console.out("Waiting for fadctrl to get configured timed out... checking for in-run FAD loss.");

                // Get the connection status before the reset is issued
                var con  = sub_connections.get();
                var stat = con.obj['status'];

                console.out("Sending MCP/RESET");
                dim.send("MCP/RESET");

                dim.wait("FTM_CONTROL", "Valid",     3000);
                dim.wait("FAD_CONTROL", "Connected", 3000);
                dim.wait("MCP",         "Idle",      3000);

                // Collect all boards with a status different from 0x43
                var list = [];
                for (var i=0; i<40; i++)
                    if (stat[i]!=0x43)
                        list.push(i);

                reconnect(list, "configuration");

                // Give up after the third attempt
                if (n==2)
                    throw e;

                //dim.wait("MCP", "Idle", 3000);
            }
        }

        // This is to check if we have missed the event. This can happen as
        // a race condition when the MCP/STOP is sent by the event handler
        // but the run was not yet fully configured.
        var statefb = dim.state("FEEDBACK").name;
        if (statefb=="Critical" || statefb=="OnStandby")
        {
            console.out("Run started by FEEDBACK in state "+statefb);
            dim.send("MCP/STOP"); // Includes FAD_CONTROL/CLOSE_ALL_OPEN_FILES

            return true;
        }

        dim.wait("MCP", "Idle", time>0 ? time*1250 : undefined); // run time plus 25%
    }
    finally
    {
        // REMOVE watchdog
        dim.onchange['FEEDBACK'] = callback;
    }

    if (incomplete)
    {
        console.out("");
        console.out(" - MCP:         "+dim.state("MCP").name);
        console.out(" - FAD_CONTROL: "+dim.state("FAD_CONTROL").name);
        console.out(" - FTM_CONTROL: "+dim.state("FTM_CONTROL").name);

        dim.wait("FTM_CONTROL", "Valid",     3000);
        dim.wait("FAD_CONTROL", "Connected", 3000);
        dim.wait("MCP",         "Idle",      3000);

        // Each bit set in 'incomplete' is translated into a board
        // index (least significant bit corresponds to index 0)
        var str = incomplete.toString(2);

        var list = [];
        for (var i=0; i<str.length; i++)
            if (str[str.length-i-1]=='1')
                list.push(i);

        reconnect(list, "data taking");

        return false;
    }

    // FIXME: What if the ext1 is not enabled in the configuration?
    if (type=="data")
    {
        var dim_trg = new Subscription("FAD_CONTROL/TRIGGER_COUNTER");

        // Make sure the subscription is closed even if get() fails
        // or the error below is thrown
        try
        {
            var counter = dim_trg.get(3000);

            // The check on physics and pedestal triggers is to ensure that
            // there was at least a chance to receive any event (e.g. in case
            // of an interrupt this might not be the case)
            if (counter.qos!=111 && // 'o' for open
                (counter.data['N_trg']>1000 || counter.data['N_ped']>5) &&
                counter.data['N_ext1']==0)
                throw new Error("No ext1 triggers received during data taking... please check the reason and report in the logbook.");
        }
        finally
        {
            dim_trg.close();
        }
    }

    return true;
}
Note: See TracBrowser for help on using the repository browser.