Index: trunk/tools/editor_trends/etl/enricher.py |
— | — | @@ -610,8 +610,8 @@ |
611 | 611 | article = {} |
612 | 612 | article['revisions'] = [] |
613 | 613 | id = False |
614 | | - #elif wikilytics == True and event == 'end': |
615 | | - # elem.clear() |
| 614 | + elif event == 'end': |
| 615 | + elem.clear() |
616 | 616 | |
617 | 617 | |
618 | 618 | def stream_raw_xml(input_queue, storage, process_id, function, dataset, locks, rts): |
— | — | @@ -735,7 +735,7 @@ |
736 | 736 | function = create_variables |
737 | 737 | storage = 'csv' |
738 | 738 | dataset = 'training' |
739 | | - processors = cpu_count() |
| 739 | + processors = 6 |
740 | 740 | extension = 'bz2' |
741 | 741 | setup(storage) |
742 | 742 | multiprocessor_launcher(function, path, dataset, storage, processors, extension) |
— | — | @@ -775,6 +775,6 @@ |
776 | 776 | |
777 | 777 | |
778 | 778 | if __name__ == '__main__': |
779 | | - #launcher_training() |
| 779 | + launcher_training() |
780 | 780 | #launcher_prediction() |
781 | | - launcher(rts) |
| 781 | + #launcher(rts) |