radip/NetworkManager.py at master · azyner/radip · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
# Class that handles a single instance of a network.
# Defines the training / testing state,
#  manages tensorboard handles.

# Step function should go here, that means it needs to be passed a BatchHandler,
# so that it can grab data easily
# This should also have the different test types, such as the accuracy graph
# Should it handle the entirety of crossfolding?
# I don't think so, that should go into another class maybe
import matplotlib
matplotlib.use('Agg')
import matplotlib.pyplot as plt
import tensorflow as tf
import os
import numpy as np
import pandas as pd
from bokeh.plotting import figure, output_file, save
from bokeh.models.widgets import PreText
from bokeh.layouts import widgetbox
from bokeh.layouts import layout
import StringIO
import sys
import glob
import time
import matplotlib as mpl
from bokeh.models import ColumnDataSource, HoverTool, Div
import shutil
import dill as pickle
from dyn_rnn_model import DynamicRnnSeq2Seq

import subprocess


class NetworkManager:
    def __init__(self, parameters, log_file_name=None):
        self.parameters = parameters
        self.network = None
        self.batchHandler = None
        self.sess = None
        self.device = None
        self.log_file_name = log_file_name
        self.model = None
        #if parent dir is train_dir, we have a checkpoint. No
        if self.parameters['train_dir'] in os.path.basename(os.path.abspath(os.path.join(log_file_name,os.pardir))):
            self.plot_directory = os.path.join(self.parameters['master_dir'], 'plots')
            # self.network_name_string = "temp123456" # The unique network name descriptor.
            self.train_dir = os.path.join(self.parameters['master_dir'], self.parameters['train_dir'])
            self.checkpoint_dir = os.path.join(self.train_dir, os.path.basename(self.log_file_name))
            self.summaries_dir = None
        else:
            self.plot_directory = os.path.join(self.parameters['master_dir'],'plots')
            #self.network_name_string = "temp123456" # The unique network name descriptor.
            self.train_dir = os.path.join(self.parameters['master_dir'], self.parameters['train_dir'])
            self.checkpoint_dir = os.path.join(self.train_dir, os.path.basename(self.log_file_name))
            self.summaries_dir = os.path.join(self.parameters['master_dir'],'tensorboard_logs')
        self.train_writer = None
        self.val_writer = None
        self.graph_writer = None
        self.ckpt_dict = {}
        self.global_state_cached = False
        self.global_state_cache = None

        self.tensorboard_graph_summaries= []
        self.tensorboard_metric_summaries = []

        self.plot_feeds = None
        self.plot_output = None
        self.metric_feeds = None
        self.metric_output = None
        self.plt_size = (10,10) #Odd format, this is multiplied by 80 to get pixel size (blame matplotlib)

        # Silence illegal summary names INFO warning.
        # It warns that ':' is illegal. However, its in the variable.name, so I can't avoid it without
        # overly verbose code.
        tf.logging.set_verbosity(tf.logging.ERROR)
        self.p_child_list = []

        return

    def build_model(self,encoder_means=None, encoder_stddev=None):
        tf.reset_default_graph()
        self.device = tf.device(self.parameters['device'])
        gpu_options = tf.GPUOptions(per_process_gpu_memory_fraction=0.9,allow_growth=True)
        self.sess = tf.Session(config=tf.ConfigProto(allow_soft_placement=True,gpu_options=gpu_options))

        if not os.path.exists(self.train_dir):
            os.makedirs(self.train_dir)
        if not os.path.exists(self.checkpoint_dir):
            os.makedirs(self.checkpoint_dir)
        ckpt = tf.train.get_checkpoint_state(self.checkpoint_dir)
        if ckpt and tf.gfile.Exists(ckpt.model_checkpoint_path + ".index"): #TODO is +.index a hack?
            print("Reading model parameters from %s" % ckpt.model_checkpoint_path)
            #tf.train.import_meta_graph(ckpt.model_checkpoint_path + ".meta")
            #saver = tf.train.Saver()
            self.model = DynamicRnnSeq2Seq(self.parameters)
            self.model.saver.restore(self.sess, ckpt.model_checkpoint_path)
        else:
            print("Created model with fresh parameters.")
            if encoder_means is None or encoder_stddev is None:
                print "Error! New model needs input scaling parameters for input normalization"
                exit(1)
                # Get scaling factors

            self.model = DynamicRnnSeq2Seq(self.parameters)
            # IMPORTANT set norm params must occur after init, otherwise the values get clobbered
            self.sess.run(tf.global_variables_initializer())
            if self.parameters['use_scaling']:
                self.model.set_normalization_params(self.sess, encoder_means, encoder_stddev)
            else:
                self.model.set_normalization_params(self.sess, [0]*len(encoder_means), [1]*len(encoder_stddev))
            print "Scaling layer means"
            print self.model.scaling_layer[0].eval(session=self.sess)
            print "Scaling layer standard dev"
            print self.model.scaling_layer[1].eval(session=self.sess)

        if self.summaries_dir is not None:
            self.train_writer = tf.summary.FileWriter(os.path.join(self.summaries_dir, self.log_file_name+'train'),
                                                      graph=self.sess.graph)
            self.val_writer = tf.summary.FileWriter(os.path.join(self.summaries_dir, self.log_file_name+'val'),
                                                    graph=self.sess.graph)
            self.graph_writer = tf.summary.FileWriter(os.path.join(self.summaries_dir, self.log_file_name + 'graph'),
                                                      graph=self.sess.graph)
            self.test_writer = tf.summary.FileWriter(os.path.join(self.summaries_dir, self.log_file_name + 'test'),
                                                     graph=self.sess.graph)
        else:
            self.train_writer = None
            self.val_writer = None
            self.graph_writer = None
            self.test_writer = None

        return

    def log_graphs_to_tensorboard(self,graphs):
        img_values = []
        for i in range(len(graphs)):
            img_summary = tf.Summary.Image(encoded_image_string=graphs[i],height=self.plt_size[1],width=self.plt_size[0])
            summary_value = tf.Summary.Value(tag=str(i),image=img_summary)
            img_values.append(summary_value)

        summary_str = tf.Summary(value=img_values)

        self.graph_writer.add_summary(summary_str, self.model.global_step.eval(session=self.sess))
        return

    # Logs a list of floats that are passed as args into Tensorboard, so they can be graphed over time.
    def log_metric_to_tensorboard(self,metrics):
        m_values = []
        for i in range(len(metrics)):
            summary_value = tf.Summary.Value(tag="metric_"+str(i),simple_value=metrics[i])
            m_values.append(summary_value)
        summary_str = tf.Summary(value=m_values)
        self.graph_writer.add_summary(summary_str, self.model.global_step.eval(session=self.sess))
        return

    def get_global_step(self):
        if self.global_state_cached == True:
            return self.global_state_cache
        else:
            self.global_state_cache = self.model.global_step.eval(session=self.sess)
            self.global_state_cached = True
        return self.global_state_cache

    def get_learning_rate(self):
        return self.model.learning_rate.eval(session=self.sess)

    def decay_learning_rate(self):
        self.sess.run(self.model.learning_rate_decay_op)
        return

    def run_training_step(self, X, Y, weights, train_model, trackwise_padding=None, summary_writer=None):
        self.global_state_cached = False
        return self.model.step(self.sess, X, Y, weights, train_model, trackwise_padding, summary_writer=summary_writer)

    def draw_categorical_bokeh_linear_plot(self, graph_results):
        plot_titles = np.sort(graph_results['origin'].unique())
        plots = []

        for origin in plot_titles:
            if self.parameters['data_format'] == 'legacy':
                if os.path.exists("QDA/" + origin + ".npy"):
                    QDA_data = np.load("QDA/" + origin + ".npy")
                QDA_mean = QDA_data[0] / 100
                QDA_meanpstd = QDA_data[1] / 100
                QDA_meanmstd = QDA_data[2] / 100
                QDA_range = np.array(range(len(QDA_mean)))
                QDA_range -= 40

            plt_title = 'Accuracy as measured relative to 20m mark. Averaged over all tracks'
            # plot 1
            dataset = graph_results[graph_results['origin'] == origin]
            x_data = []
            y_data = []
            tp_data = []
            fp_data = []
            fn_data = []
            try:
                f1_labels = True
                graph_results['f1_score']
                for range_val in np.unique(dataset['distance']):
                    data_at_range = dataset[dataset['distance'] == range_val]
                    x_data.append(range_val)
                    y_data.append(data_at_range['f1_score'][0])
                    tp_data.append(data_at_range['true_positive'][0])
                    fp_data.append(data_at_range['false_positive'][0])
                    fn_data.append(data_at_range['false_negative'][0])
            except KeyError:
                f1_labels = False
                for range_val in np.unique(dataset['d_thresh']):
                    # If I group by track number here, I can get a collection of accuracy scores
                    # and therefore a std dev
                    data_at_range = dataset[dataset['d_thresh'] == range_val]
                    acc = np.average(np.equal(data_at_range['output_idxs'],
                                              data_at_range['destination_vec']))
                    x_data.append(range_val)
                    y_data.append(acc)

            p1 = figure(title='Origin: ' + origin, x_axis_label='Dis from Ref Line (m)', y_axis_label='Acc.',
                        plot_width=500, plot_height=500,x_range=(-12, 35), y_range=(0, 1.05),)  # ~half a 1080p screen
            if not f1_labels:
                p1.line(x_data, y_data, legend="Acc. RNN", line_width=2, color='green')
            else:
                p1.line(x_data, y_data, legend="F1 Score RNN", line_width=2, color='green')
                p1.line(x_data, tp_data, legend="True Positive Percent RNN", line_width=2, color='yellow')
                p1.line(x_data, fp_data, legend="False Positive Percent RNN", line_width=2, color='orange')
                p1.line(x_data, fn_data, legend="False Negative Percent RNN", line_width=2, color='blue')

            if self.parameters['data_format'] == 'legacy':
                p1.line(QDA_range, QDA_mean, legend="Acc. QDA", line_width=2, color='red', line_alpha=1)
            # p1.line(QDA_range, QDA_meanmstd, line_width=2, color='red', line_alpha=0.5)
            # p1.line(QDA_range, QDA_meanpstd, line_width=2, color='red', line_alpha=0.5)
            # p1.line(bbox_range, loss, legend="Loss.", line_width=2, color='blue')
            # p1.line(bbox_range, output_gen_plt[:, 1], legend="Generated Output.", line_width=2, color='red')
            p1.legend.location = "bottom_right"
            plots.append(p1)
        return plots

    def draw_categorical_bokeh_topographical_plot(self, results_per_dis_df, batch_handler):
        image_filename = 'leith-croydon.png'
        if not os.path.exists(os.path.join(self.plot_directory,image_filename)):
            shutil.copy(os.path.join('images',image_filename),os.path.join(self.plot_directory,image_filename))

        plots = []
        batch_handler.data_pool.track_idx.unique()
        data_pool = batch_handler.data_pool

        for track_origin in np.sort(results_per_dis_df['origin'].unique()):
            # 1 plot per origin
            track_origin_df = results_per_dis_df[results_per_dis_df.origin == track_origin]

            tooltips = []
            for name in ['Accuracy','Object_X','Object_Y','distance','distance_to_exit','AbsVelocity']:
                   tooltips.append(tuple([name, "@" + name])) # X,Y Vel, Distance to xx, accuracy.
            hover = HoverTool(tooltips=tooltips)

            p = figure(plot_height=500, plot_width=500, title=track_origin, x_range=(-35, 10), y_range=(-30, 15),
                       tools=[hover, 'pan', 'wheel_zoom', 'box_zoom', 'reset', 'resize'])
            # Angle is in radians, rotates around anchor
            p.image_url([image_filename], x=-15.275, y=-3.1, w=147.45, h=77.0, angle=0,
                        anchor='center', global_alpha=0.7)

            for destination in track_origin_df['destination'].unique():
                dest_class_df = track_origin_df[track_origin_df['destination']==destination]
                x_av = []
                y_av = []
                acc = []
                dis_to_exit_av = []
                vel_av = []
                for dis in np.sort(dest_class_df['d_thresh'].unique()):
                    d_thresh_df = dest_class_df[dest_class_df['d_thresh'] == dis]
                    x_av.append(np.average(d_thresh_df['Object_X']))
                    y_av.append(np.average(d_thresh_df['Object_Y']))
                    vel_av.append(np.average(d_thresh_df['AbsVelocity']))
                    acc.append(np.average(np.average(np.equal(d_thresh_df['output_idxs'],
                                                               d_thresh_df['destination_vec']))))
                    dis_to_exit_av.append(np.average(d_thresh_df['distance_to_exit']))

                    colours= [
                    "#%02x%02x%02x" % (int(r), int(g), int(b)) for r, g, b, _ in
                    255 * mpl.cm.plasma(mpl.colors.Normalize(vmin=0.3,vmax=1.0)(acc))
                    ]
                source_df = pd.DataFrame({"Object_X": x_av,
                                          "Object_Y": y_av,
                                          "Accuracy":acc,
                                          "distance_to_exit":dis_to_exit_av,
                                          'distance':np.sort(dest_class_df['d_thresh'].unique()),
                                          'AbsVelocity':vel_av,
                                          'colours':colours})
                plot_source = ColumnDataSource(data=source_df)
                p.circle(x="Object_X", y="Object_Y", size=4, fill_color="colours", fill_alpha=0.6,
                         line_color="colours", source=plot_source)
            plots.append(p)

        return plots

    def draw_categorical_html_graphs(self, batch_handler):

        if not os.path.exists(self.plot_directory):
            os.makedirs(self.plot_directory)
        plt_path = os.path.join(self.plot_directory, os.path.basename(self.log_file_name) + '.html')
        # If I am running this many times, make new filenames
        if os.path.exists(plt_path):
            path_idx = 1
            while os.path.exists(plt_path):
                plt_path = os.path.join(self.plot_directory,
                                        os.path.basename(self.log_file_name) + "-%02d" % path_idx + '.html')
                path_idx += 1

        output_file(plt_path)

        results_per_dis = self.compute_result_per_dis(batch_handler, plot=False)
        # Run a model loaded from checkpoint, then save results_per_dis to pickle (dill), with parameters as well.
        # Then I can pass all those into a directory, and run the plotter again.
        pkl_path = os.path.join(self.plot_directory, os.path.basename(self.log_file_name) + '.pkl')
        with open(pkl_path,'wb') as pkl_file:
            to_pkl = {'parameters': self.parameters,
                      'results_per_dis': results_per_dis}
            pickle.dump(to_pkl,pkl_file)
        dis_f1_report = self.compute_distance_f1_report(results_per_dis)
        top_plots = self.draw_categorical_bokeh_topographical_plot(results_per_dis, batch_handler)
        linear_plots = self.draw_categorical_bokeh_linear_plot(results_per_dis)

        #topographical_plots = self.draw_bokeh_topographical_plot(graph_results)

        # Dump all the metadata to a big string.
        label_str = ""
        for key, value in self.parameters.iteritems():
            label_str += str(key) + ': ' + str(value) + "\r\n"
        paragraph_1 = PreText(text=label_str)


        l = layout([top_plots, linear_plots, [widgetbox(paragraph_1, width=800)]])
        save(l)
        # show(widgetbox(button_1, width=300))

        return

    def draw_categorical_png_graphs_perf_dist(self, graph_results):
        fig_dir = self.plot_directory + "_img"
        if not os.path.exists(fig_dir):
            os.makedirs(fig_dir)

        graph_list = []

        plot_titles = graph_results['origin'].unique()
        for origin in plot_titles:
            if self.parameters['data_format'] == 'legacy':
                if os.path.exists("QDA/" + origin + ".npy"):
                    QDA_data = np.load("QDA/" + origin + ".npy")
                QDA_mean = QDA_data[0] / 100
                QDA_meanpstd = QDA_data[1] / 100
                QDA_meanmstd = QDA_data[2] / 100
                QDA_range = np.array(range(len(QDA_mean)))
                QDA_range -= 40
            dataset = graph_results[graph_results['origin'] == origin]
            x_data = []
            y_data = []
            tp_data = []
            fp_data = []
            fn_data = []
            try:
                f1_labels = True
                graph_results['f1_score']
                for range_val in np.unique(dataset['distance']):
                    data_at_range = dataset[dataset['distance'] == range_val]
                    x_data.append(range_val)
                    y_data.append(data_at_range['f1_score'][0])
                    tp_data.append(data_at_range['true_positive'][0])
                    fp_data.append(data_at_range['false_positive'][0])
                    fn_data.append(data_at_range['false_negative'][0])

            except KeyError:
                f1_labels = False
                for range_val in np.unique(dataset['d_thresh']):
                    # If I group by track number here, I can get a collection of accuracy scores
                    # and therefore a std dev
                    data_at_range = dataset[dataset['d_thresh'] == range_val]
                    acc = np.average(np.equal(data_at_range['output_idxs'],
                                              data_at_range['destination_vec']))
                    x_data.append(range_val)
                    y_data.append(acc)

            legend_str = []
            fig = plt.figure(figsize=self.plt_size)


            if self.parameters['data_format'] == 'legacy':
                plt.plot(QDA_range, QDA_mean,'r-')
                legend_str.append(['Acc. QDA'])
            plt.title('Origin: ' + origin)
            plt.xlabel('Distance from Ref Line (m)')
            if not f1_labels:
                plt.plot(x_data, y_data, 'g-', label=origin)
                plt.ylabel('Accuracy')
                legend_str.append(['Acc. RNN'])
            else:
                plt.plot(x_data, y_data, 'g-', label=origin)
                plt.ylabel('Value')
                legend_str.append(['F1 Score'])
                plt.plot(x_data, fp_data,'r-')
                legend_str.append(['False Positive Percent'])
                plt.plot(x_data, fn_data,'b-')
                legend_str.append(['False Negative Percent'])
                plt.plot(x_data, tp_data,'c-')
                legend_str.append(['True Positive Percent'])
            plt.legend(legend_str, loc='upper left')

            fig_path = os.path.join(self.plot_directory + "_img", self.log_file_name + '-' +
                                    str(self.get_global_step()) + '-' + origin+ '.png')
            plt.savefig(fig_path, bbox_inches='tight')

            fig.canvas.draw()
            fig_s = fig.canvas.tostring_rgb()
            fig_data = np.fromstring(fig_s,np.uint8)
            fig_data = fig_data.reshape(fig.canvas.get_width_height()[::-1] + (3,))
            s = StringIO.StringIO()
            plt.imsave(s, fig_data,format='png')
            fig_data = s.getvalue()
            graph_list.append(fig_data)
            plt.close()

        return graph_list

    # def _pick_class(self,distribution):
    #     threshold = 0.95
    #     pop = np.sum(distribution)
    #     distribution = distribution / pop
    #     (dist_results.iloc[0]['dest_1_hot'].astype(int) == (dist_results.iloc[0]['output_pop'][0] > 95).astype(
    #         int)).all()
    #
    #     return

    def draw_generative_html_graphs(self, batch_handler, multi_sample=1):

        if not os.path.exists(self.plot_directory):
            os.makedirs(self.plot_directory)
        plt_path = os.path.join(self.plot_directory, str(multi_sample) + "-" + os.path.basename(self.log_file_name) + '.html')
        # If I am running this many times, make new filenames
        if os.path.exists(plt_path):
            path_idx = 1
            while os.path.exists(plt_path):
                plt_path = os.path.join(self.plot_directory,
                                        os.path.basename(self.log_file_name) + "-%02d" % path_idx + '.html')
                path_idx += 1

        output_file(plt_path)

        #results_per_dis = self.compute_result_per_dis(batch_handler, plot=False)
        # Get some results here
        # I am going to run a single full sequence on a batch. Then pick first N sequences to create N graphs.

        #Get results:
        batch_frame = batch_handler.get_minibatch()
        graph_x, graph_future, weights, graph_labels, track_padded = \
            batch_handler.format_minibatch_data(
                batch_frame['encoder_sample'],
                batch_frame['decoder_sample'],
                batch_frame['batchwise_padding'],
                batch_frame['trackwise_padding'] if self.parameters['track_padding'] else None)
        train_y = graph_future

        multi_sampled_predictions = []
        observations = batch_frame['encoder_sample'].values
        ground_truths = batch_frame['decoder_sample'].values
        csv_names = batch_frame['csv_name'].values

        for i in range(multi_sample):
            # BEGIN Run this step 100 times and dimensionalize results.
            return_val = self.model.step(self.sess, graph_x, train_y, weights, False, track_padded, summary_writer=None)
            acc = return_val[0]
            loss = return_val[1]
            model_outputs = return_val[2]
            mixtures = return_val[3]
            padding = return_val[4]
            multi_sampled_predictions.append(np.swapaxes(np.array(model_outputs), 0, 1))

        # END

        multi_sampled_predictions = np.swapaxes(np.array(multi_sampled_predictions),0,1)

        # I should probably copy all images here.
        image_filename = 'leith-croydon.png'
        if not os.path.exists(os.path.join(self.plot_directory, image_filename)):
            shutil.copy(os.path.join('images', image_filename), os.path.join(self.plot_directory, image_filename))

        plots = []
        plot_count = 0
        for obs, preds, gt, csv_name in zip(observations, multi_sampled_predictions, ground_truths, csv_names):
            #New plot

            if 'queen-hanks' in csv_name:
                x_range = (3, 47)
                y_range = (-17, 11)
            if 'leith-croydon' in csv_name:
                x_range = (-35, 10)
                y_range = (-30, 15)
            if 'roslyn-crieff' in csv_name:
                x_range = (-31, -10)
                y_range = (-15, 8)
            if 'oliver-wyndora' in csv_name:
                x_range = (-28, -8)
                y_range = (-12, 6)
            if 'orchard-mitchell' in csv_name:
                x_range = (-32, -5)
                y_range = (-23, 5)

            p = figure(plot_height=500, plot_width=500, title="Generative track testing",
                       x_range=x_range, y_range=y_range)
            if 'leith-croydon' in csv_name:
                p.image_url(['leith-croydon.png'], x=-15.275, y=-3.1, w=147.45, h=77.0, angle=0,
                        anchor='center', global_alpha=0.7)

            p.line(gt[:,0],gt[:,1],line_color='blue',legend='Ground_truth')
            p.line(obs[:,0],obs[:,1],line_color='green',legend='observation')
            for j in range(preds.shape[0]):
                p.line(preds[j][:,0],preds[j][:,1],line_color='red',legend='prediction')

            plots.append([p])
            plot_count += 1
            if plot_count > 20:
                break

        # Plot results:
        #top_plots = self.draw_categorical_bokeh_topographical_plot(outputs, batch_handler)
        #linear_plots = self.draw_categorical_bokeh_linear_plot(outputs)

        #topographical_plots = self.draw_bokeh_topographical_plot(graph_results)

        # Dump all the metadata to a big string.
        label_str = ""
        for key, value in self.parameters.iteritems():
            label_str += str(key) + ': ' + str(value) + "\r\n"
        paragraph_1 = PreText(text=label_str)

        plots.append([widgetbox(paragraph_1, width=800)])
        #l = layout([top_plots, linear_plots, [widgetbox(paragraph_1, width=800)]])
        save(layout(plots))
        # show(widgetbox(button_1, width=300))

        return

    def join_subprocesses(self):
        # Join.
        for p_child in self.p_child_list:
            while p_child.poll() is None:
                time.sleep(0.1)
        # Now that all children have finished, we may empty the list.
        self.p_child_list = []

    def draw_generative_png_graphs(self, batch_handler, multi_sample=1, draw_prediction_track=True, final_run=False, ):

        if not final_run:
            fig_dir = self.plot_directory + "_img"
        else:
            fig_dir = self.plot_directory + "_img_final"
        if not os.path.exists(fig_dir):
            os.makedirs(fig_dir)

        #Get results:
        if final_run:
            batch_handler.set_distance_threshold(0)
            batch_frame, _ = batch_handler.get_sequential_minibatch()
            batch_handler.set_distance_threshold(None)
        else:
            batch_frame = batch_handler.get_minibatch()

        graph_x, graph_future, weights, graph_labels, trackwise_padding = \
            batch_handler.format_minibatch_data(
                batch_frame['encoder_sample'],
                batch_frame['decoder_sample'],
                batch_frame['batchwise_padding'],
                batch_frame['trackwise_padding'] if self.parameters['track_padding'] else None)
        observations = batch_frame['encoder_sample'].values
        ground_truths = batch_frame['decoder_sample'].values
        csv_names = batch_frame['csv_name'].values
        train_y = graph_future
        # Drawing a single mixture sample from the network (the normal operation) results in a list of len 1
        multi_sampled_predictions = []
        multi_sampled_mixtures = []
        multi_sampled_padding_logits = []

        for i in range(multi_sample):
            return_val = self.model.step(self.sess, graph_x, train_y, weights, False, trackwise_padding, summary_writer=None)
            acc = return_val[0]
            loss = return_val[1]
            model_outputs = return_val[2]
            mixtures = return_val[3]
            padding_logits = return_val[4]
            num_mixtures = len(mixtures[0][0]) / 6
            multi_sampled_mixtures.append(mixtures.reshape(mixtures.shape[0], mixtures.shape[1], num_mixtures, 6, order='F'))
            multi_sampled_predictions.append(np.swapaxes(np.array(model_outputs), 0, 1))
            multi_sampled_padding_logits.append(np.array(padding_logits))

        multi_sampled_predictions = np.swapaxes(np.array(multi_sampled_predictions), 0, 1)
        multi_sampled_mixtures = np.swapaxes(np.array(multi_sampled_mixtures), 0, 1)
        multi_sampled_padding_logits = np.swapaxes(np.array(multi_sampled_padding_logits), 0, 1)
        # Now the first dimension is whether I wanted to pull multiple outputs from the same input Monte Carlo style
        # Only works if the network is non-deterministic in some way.
        graph_list = []
        graph_number = 0
        graph_max = 20 if final_run else 10
        multithread = True
        if multithread:
            # Wait for any old threads to finish. Not allowed to spawn multiple sets of children, it gets out of hand fast.
            self.join_subprocesses()
        for obs, preds, gt, mixes, csv_name, pad_logits, trackwise_padding, rel_destination in zip(
                observations, multi_sampled_predictions, ground_truths, multi_sampled_mixtures, csv_names,
                multi_sampled_padding_logits, np.array(trackwise_padding).transpose(), batch_frame.relative_destination):
            graph_number += 1
            # WARNING! If you want more than ten, turn off multithreading. I don't use a queue.
            # The kernel handles all of them, so they will all get memory alloc. Looks to be 200MB each
            if graph_number > graph_max:
                break

            if multithread:
                args_dict = {"obs": obs,
                             "preds": {"RNN": preds},
                             "gt": gt,
                             "mixes": mixes,
                             "pad_logits": pad_logits,
                             "trackwise_padding": trackwise_padding,
                             "plt_size": self.plt_size,
                             "draw_prediction_track": draw_prediction_track,
                             "plot_directory": self.plot_directory,
                             "log_file_name": self.log_file_name,
                             "multi_sample": multi_sample,
                             "global_step": self.get_global_step(),
                             "graph_number": graph_number,
                             "fig_dir": fig_dir,
                             "csv_name": csv_name,
                             "padding_logits": multi_sampled_padding_logits,
                             "relative_destination": rel_destination,
                             'parameters': self.parameters,
                             'padding_mask': 'None'}
                # HACK I would prefer a child that then maintains its own children with queued workers. This allows
                # the child process to hand out fresh jobs without interrupting main, but its a lot of work. So instead,
                # to stop starving main, I force these to only be able to use half the cores.
                p_child = subprocess.Popen(["taskset", "-c", "0,1,2,3",
                                            "nice", "-n", "19",
                                            "/usr/bin/python2", "utils_draw_graphs.py"], stdin=subprocess.PIPE)
                p_child.stdin.write(pickle.dumps(args_dict))
                p_child.stdin.close()
                self.p_child_list.append(p_child)
            else:
                import utils_draw_graphs
                graph_list.append(utils_draw_graphs.draw_png_heatmap_graph(obs, {"RNN": preds}, gt, mixes, pad_logits,
                                                                           trackwise_padding,
                                                                           self.plt_size, draw_prediction_track,
                                  self.plot_directory, self.log_file_name, multi_sample,
                                  self.get_global_step(), graph_number, fig_dir, csv_name, rel_destination, self.parameters, padding_mask='None'))

        if multithread and final_run:
            self.join_subprocesses()
        return graph_list

    def compute_distance_f1_report(self, dist_results):
        # Maybe at the end of training I want a ROC curve on the confidence threshold.
        # Right now I want an F1 score with a default threshold.

        # FIXME can I get classes a better way?
        classes = dist_results.origin.unique()
        f1_df_list = []

        # Declare class based on output_pop
        population = np.sum(dist_results.iloc[0]['output_pop'])
        dist_results = dist_results.assign(norm_pop=dist_results['output_pop']/population)
        class_threshold = 0.95
        dist_results = dist_results.assign(chosen_pop=pd.Series([(x > class_threshold).astype(float) for x in dist_results['norm_pop']]))
        dist_results['correct_classification'] = \
            dist_results.apply(lambda x: True if (x['chosen_pop'] == x['dest_1_hot']).all() else False, axis=1)
        dist_results['any_classification'] = \
            dist_results.apply(lambda x: True if (x['chosen_pop']).any() else False, axis=1)

        for distance in dist_results['d_thresh'].unique():
            distance_set = dist_results[dist_results['d_thresh'] == distance]

            #f1 score calc needs:
            # True positive = number correctly classified
            # False Positive = Number incorrectly classified as this class
            # False Negative = Number without class, or wrong class.
            for origin in classes:
                origin_subset = distance_set[distance_set['origin'] == origin]
                origin_dist = len(origin_subset)
                TP = len(origin_subset[origin_subset['correct_classification'] == True])
                FN = len(origin_subset[origin_subset['any_classification'] == False])
                FP = origin_dist - TP - FN
                #print ("Dis: %3.2fm Dest: %5s TP %2d FN %2d FP %2d" % (distance, dest, TP, FN, FP))
                try:
                    f1 = 2*TP / float(2*TP + FP + FN)
                except ZeroDivisionError:
                    f1 = 0.0
                n_tracks = len(origin_subset)
                if n_tracks == 0: n_tracks = 1 # If this is zeo, then FP,FN and TP are zero as well..
                f1_df_list.append(pd.DataFrame({"origin": origin,
                                                "distance": distance,
                                                "f1_score": f1,
                                                "true_positive": TP / n_tracks,
                                                "false_positive": FP / n_tracks,
                                                "false_negative": FN / n_tracks,
                                                "n_tracks": n_tracks
                                                },index=[0]))
        f1_df = pd.concat(f1_df_list)
        return f1_df

    # This function needs the validation batch (or test batch)
    # This is to be refactored as a report writer, that is done every n minutes
    # ~5 min for soak, ~20 min for long
    # This system should then do a ROC analysis at each distance we care about
    def compute_result_per_dis(self, batch_handler, plot=True):
        # Legacy plot needs exactly one data point per meter.
        min_plot = max([-15,int(0.5+min(batch_handler.data_pool['distance']))])
        max_plot = min([60,int(max(batch_handler.data_pool['distance']))])
        print "min_plot: " + str(min_plot) + ' max_plot: ' + str(max_plot)
        if plot:
            bbox_range_plot = np.arange(min_plot,max_plot,1).tolist()
        else:
            bbox_range_plot = np.arange(min_plot, max_plot, 0.5).tolist()

        graph_results = []
        # This could be optimized.
        # If the batch size is larger than twice a sequential minibatch
        # I could run two distances per step.
        print ""
        #TEMP
        if True:
        #batch_handler.generate_distance_minibatches(bbox_range_plot)
        # for d in bbox_range_plot:
        #     sys.stdout.write("\rGenerating distance report: %03.1fm %10s" % (d, ''))
        #     sys.stdout.flush()
            # Set d_thresh
            # Do it in a loop in case batch_size < num_val_tracks
            dis_thresh_time = time.time()
            #batch_handler.set_distance_threshold(d)
            batch_handler.set_distance_threshold_ranges(bbox_range_plot)
            #print "Time to set dis thresh: " + str (time.time() - dis_thresh_time)
            batch_complete = False

            batch_time = time.time()
            busy_indicator = ['-', '\\', '|', '/']
            batch_counter = 0
            while not batch_complete:
                #print "Running batch"
                sys.stdout.write("\rWriting distance report...%s" % busy_indicator[batch_counter%len(busy_indicator)])
                sys.stdout.flush()
                mini_batch_frame, batch_complete = batch_handler.get_sequential_minibatch()
                #TODO check if mini_batch_frame is empty here. If I have no data at all for this range.
                if mini_batch_frame is None:
                    break
                val_x, val_future, val_weights, val_labels, track_padded = \
                    batch_handler.format_minibatch_data(mini_batch_frame['encoder_sample'],
                                                        mini_batch_frame['dest_1_hot'] if
                                                        self.parameters['model_type'] == 'classifier' else
                                                        mini_batch_frame['decoder_sample'] if
                                                        self.parameters['model_type'] == 'MDN' else exit(2),
                                                        mini_batch_frame['batchwise_padding'],
                                                        mini_batch_frame['trackwise_padding'] if
                                                        self.parameter_dict['track_padding'] else None)
                valid_data = np.logical_not(mini_batch_frame['batchwise_padding'].values)
                val_y = val_labels if self.parameters['model_type'] == 'classifier' else \
                          val_future if self.parameters['model_type'] == 'MDN' else exit(3)
                #print "Time to get minibatch: " + str(time.time()-batch_time)

                #TODO Param this:
                output_samples = []
                num_samples = 1
                for _ in range(num_samples):
                    acc, loss, outputs, mixtures, padding = self.model.step(self.sess, val_x, val_y,
                                                         val_weights, False, track_padded, summary_writer=None)
                    # Do a straight comparison between val_y and outputs.
                    #output_idxs = np.argmax(outputs[0][valid_data], axis=1)
                    output_samples.append(outputs)

                #Get a population count of what the network thinks.
                output_samples_arr = np.array(output_samples).squeeze(axis=1)
                output_1_hot = np.eye(output_samples_arr.shape[2])[np.argmax(output_samples_arr, axis=2)]
                output_pop = np.sum(output_1_hot,axis=0)

                #Get a percentage of population in the correct class.
                y_idxs = np.argmax(val_y,axis=2).squeeze()
                acc_pop = output_pop[0][y_idxs]/num_samples

                # Drop all results that are just padding to make the minibatch square.
                output_pop = output_pop[valid_data]
                acc_pop = acc_pop[valid_data]
                mini_batch_frame = mini_batch_frame[mini_batch_frame['batchwise_padding'] == False]

                # TODO Repeal and replace this qualifier.
                # Compute max pop. Assign it to idx for now. LEGACY FUNCTION
                output_idxs = np.argmax(output_pop,axis=1)
                mini_batch_frame = mini_batch_frame.assign(output_idxs=output_idxs)
                mini_batch_frame = mini_batch_frame.assign(acc_pop=acc_pop)
                mini_batch_frame = mini_batch_frame.assign(output_pop=pd.Series([x for x in output_pop],dtype=object))
                #mini_batch_frame = mini_batch_frame.assign(d_thresh=np.repeat(d,len(mini_batch_frame)))

                graph_results.append(mini_batch_frame)
                batch_counter += 1
            print "Time to run dis batches: " + str(time.time() - batch_time)

        #Concat once only, much faster
        graph_results_frame = pd.concat(graph_results)

        # Reset handler
        batch_handler.set_distance_threshold(None)
        batch_handler.set_distance_threshold_ranges(None)

        return graph_results_frame

    def evaluate_pdis_metric(self, results):

        d_array = []
        for origin in results['origin'].unique():
            # Generate the set of all distances that are not 100% accurate (i.e. they have a incorrect classification)
            # Remove from the set of all distances, creating only a set of distances with a perfect score
            # Return lowest number (the earliest result)
            dis_unique = results['d_thresh'].unique()
            dist_delta = dis_unique[1] - dis_unique[0]
            reduced_df = results[results['origin']==origin]
            perfect_dist = np.setdiff1d(dis_unique,
                                        reduced_df[
                                            reduced_df['destination_vec']!=reduced_df['output_idxs']
                                        ].d_thresh.unique())
            #If we got none right OR the final value is incorrect (rare case)
            if (len(perfect_dist) < 2) or\
                    (perfect_dist[-1] != dis_unique[-1]):
                d_array.append(np.max(dis_unique))
            else:
                # Find the end of the continuous sequence at the end of the graph
                # Return this point
                for i in reversed(range(1,len(perfect_dist))):
                    if perfect_dist[i] - perfect_dist[i-1] != dist_delta:
                        break
                perfect_dist_threshold = perfect_dist[i]
                d_array.append(np.min(perfect_dist_threshold))

        return d_array, results['origin'].unique()

    def evaluate_0_acc_metric(self, results):
        for origin in results['origin'].unique():
            origin_results = results[results['origin']==origin]
            origin_0_results = origin_results[origin_results['d_thresh']==0]


        return results


    # Function that passes the entire validation dataset through the network once and only once.
    # Return cumulative accuracy, loss
    def run_validation(self, batch_handler, summary_writer=None, quick=False, report_writing=False, distance_threshold=0):
        batch_complete = False
        batch_losses = []
        total_correct = 0
        total_valid = 0
        all_averages = []
        report_list = []
        if report_writing:
            batch_handler.set_distance_threshold(distance_threshold)
        while not batch_complete:
            #val_x, val_y, val_weights, pad_vector, batch_complete = batch_handler.get_sequential_minibatch()
            if quick or (self.parameters['model_type']=='MDN' and not report_writing):
                # Run one regular batch. Debug mode takes longer, and there are ~30,000 val samples
                mini_batch_frame = batch_handler.get_minibatch()
                batch_complete = True
                #print "Debug active, valdating with random sample, not whole batch"
            else:
                mini_batch_frame, batch_complete = batch_handler.get_sequential_minibatch()

            val_x, val_future, val_weights, val_labels, track_padded = batch_handler.format_minibatch_data(
                mini_batch_frame['encoder_sample'],
                mini_batch_frame['dest_1_hot'] if self.parameters['model_type'] == 'classifier' else
                mini_batch_frame['decoder_sample'] if self.parameters['model_type'] == 'MDN' else exit(2),
                mini_batch_frame['batchwise_padding'],
                mini_batch_frame['trackwise_padding'] if self.parameters['track_padding'] else None)
            valid_batch_data = np.logical_not(mini_batch_frame['batchwise_padding'].values)
            val_y = val_labels if self.parameters['model_type'] == 'classifier' else \
                val_future if self.parameters['model_type'] == 'MDN' else exit(3)

            acc, loss, outputs, mixtures, padding_logits = \
                self.model.step(self.sess, val_x, val_y, val_weights, False, track_padded, summary_writer=summary_writer)

            if self.parameters['model_type'] == 'classifier':
                output_idxs = np.argmax(outputs[0][valid_batch_data], axis=1)
                y_idxs = np.argmax(np.array(val_y)[0][valid_batch_data], axis=1)
                num_correct = np.sum(np.equal(output_idxs,y_idxs)*1)
                num_valid = np.sum(valid_batch_data*1)
                total_correct += num_correct
                total_valid += num_valid
            if report_writing:
                # TODO If multi-sampled mixtures is desired at test/validation report time, it needs to be implemented here
                mini_batch_frame = mini_batch_frame[valid_batch_data]
                outputs_a = np.swapaxes(np.array(outputs), 0, 1)
                mixture_components = 6
                num_mixtures = len(mixtures[0][0]) / mixture_components
                mixtures = np.array(mixtures.reshape(mixtures.shape[0], mixtures.shape[1], num_mixtures, mixture_components, order='F'))
                # Reject batchwise padding multi_sampled_mixtures.append()
                outputs_ar = [np.array([x]) for x in outputs_a[valid_batch_data]]
                # Single item list for multisample compatibility
                mixtures_ar = [np.array([x]) for x in mixtures[valid_batch_data]]
                padding_logits_ar = [np.array([x]) for x in padding_logits[valid_batch_data]]

                mini_batch_frame = mini_batch_frame.assign(outputs=outputs_ar)
                mini_batch_frame = mini_batch_frame.assign(mixtures=mixtures_ar)
                mini_batch_frame = mini_batch_frame.assign(padding_logits=padding_logits_ar)

                report_list.append(mini_batch_frame)

            batch_losses.append(loss)
            all_averages.append(acc)

        if self.parameters['model_type'] == 'classifier':
            batch_acc = np.float32(total_correct) / np.float32(total_valid)
        else:
            batch_acc = np.mean(all_averages)

        if report_writing:
            batch_handler.set_distance_threshold(None)
            report_df = pd.concat(report_list)
        else:
            report_df = None

        return batch_acc, np.average(batch_losses), report_df, None

    # Checkpoints model. Adds path to global dict lookup
    def checkpoint_model(self):
        self.ckpt_dict[self.get_global_step()] = \
            self.model.saver.save(self.sess, os.path.join(self.checkpoint_dir, 'model-chkpt'),
                              global_step=self.get_global_step())

    def load_from_checkpoint(self,g_step=None):
        ckpt = tf.train.get_checkpoint_state(self.checkpoint_dir)
        if g_step:
            ckpt_dir = self.ckpt_dict[g_step]
        else:
            ckpt_dir = ckpt.model_checkpoint_path
        if ckpt and ckpt_dir:
            print("Reading model parameters from %s" % ckpt_dir)
            self.model.saver.restore(self.sess, ckpt_dir)
        return

    def clean_checkpoint_dir(self,g_step=None):
        ckpt = tf.train.get_checkpoint_state(self.checkpoint_dir)
        for checkpoint in ckpt.all_model_checkpoint_paths:
            if (g_step is not None and
                checkpoint != self.ckpt_dict[g_step]):
                [os.remove(file) for file in glob.glob(checkpoint + "*")]