Hide keyboard shortcuts

Hot-keys on this page

r m x p   toggle line displays

j k   next/prev highlighted chunk

0   (zero) top of page

1   (one) first highlighted chunk

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

62

63

64

65

66

67

68

69

70

71

72

73

74

75

76

77

78

79

80

81

82

83

84

85

86

87

88

89

90

# -*- coding: utf-8 -*- 

# 

# Licensed under the Apache License, Version 2.0 (the "License"); 

# you may not use this file except in compliance with the License. 

# You may obtain a copy of the License at 

# 

# http://www.apache.org/licenses/LICENSE-2.0 

# 

# Unless required by applicable law or agreed to in writing, software 

# distributed under the License is distributed on an "AS IS" BASIS, 

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 

# See the License for the specific language governing permissions and 

# limitations under the License. 

 

import multiprocessing 

import subprocess 

import time 

 

from builtins import range 

 

from airflow import configuration 

from airflow.executors.base_executor import BaseExecutor 

from airflow.utils.state import State 

from airflow.utils.logging import LoggingMixin 

 

PARALLELISM = configuration.get('core', 'PARALLELISM') 

 

 

class LocalWorker(multiprocessing.Process, LoggingMixin): 

 

def __init__(self, task_queue, result_queue): 

multiprocessing.Process.__init__(self) 

self.task_queue = task_queue 

self.result_queue = result_queue 

self.daemon = True 

 

def run(self): 

while True: 

key, command = self.task_queue.get() 

if key is None: 

# Received poison pill, no more tasks to run 

self.task_queue.task_done() 

break 

self.logger.info("{} running {}".format( 

self.__class__.__name__, command)) 

command = "exec bash -c '{0}'".format(command) 

try: 

subprocess.check_call(command, shell=True) 

state = State.SUCCESS 

except subprocess.CalledProcessError as e: 

state = State.FAILED 

self.logger.error("failed to execute task {}:".format(str(e))) 

# raise e 

self.result_queue.put((key, state)) 

self.task_queue.task_done() 

time.sleep(1) 

 

 

class LocalExecutor(BaseExecutor): 

""" 

LocalExecutor executes tasks locally in parallel. It uses the 

multiprocessing Python library and queues to parallelize the execution 

of tasks. 

""" 

 

def start(self): 

self.queue = multiprocessing.JoinableQueue() 

self.result_queue = multiprocessing.Queue() 

self.workers = [ 

LocalWorker(self.queue, self.result_queue) 

for i in range(self.parallelism) 

] 

 

for w in self.workers: 

w.start() 

 

def execute_async(self, key, command, queue=None): 

self.queue.put((key, command)) 

 

def sync(self): 

while not self.result_queue.empty(): 

results = self.result_queue.get() 

self.change_state(*results) 

 

def end(self): 

# Sending poison pill to all worker 

[self.queue.put((None, None)) for w in self.workers] 

# Wait for commands to finish 

self.queue.join() 

self.sync()