a few extra ideas

pull/18/head
Christopher Usher 6 years ago committed by Mike Lang
parent 0e7ba25b76
commit 05fed36ac8

@@ -3,6 +3,10 @@
# lots about web services and the like I don't know
# needs logging, exception handling and the like
# when starting the backfiller and every few hours, backfill everything
# more frequently, backfill the last couple hours
# (last three hour directories so always at least two hours).

import glob
import requests
import os
@@ -10,74 +14,76 @@ import os
def get_nodes():
    # either read a config file or query the database to get the addresses
    # of the other nodes
    # as a prototype can just hardcode some addresses.
    nodes = []
    return nodes
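A minimal sketch of the config-file option mentioned in the comment above; the path and one-address-per-line format are illustrative assumptions, not a settled wubloader convention:

# hypothetical helper, assuming a plain text file with one node address
# per line and '#' for comment lines
def get_nodes_from_config(config_path='/etc/wubloader/nodes.conf'):
    nodes = []
    with open(config_path) as f:
        for line in f:
            line = line.strip()
            if line and not line.startswith('#'):
                nodes.append(line)
    return nodes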
def list_remote_segments(node):
    # return a list of paths
    # obviously update path with real one
    resp = requests.get(node + '/wubloader/segment_list')
    remote_segments = resp.json()  # replace with appropriate parser
    return remote_segments

#based on _get_segment in downloader/main
#should have a more general shared version of this
def get_remote_segment(node, segment):
    # obviously update path with real one
    resp = requests.get(node + '/wubloader/segments/' + segment, stream=True)
    # write to a temp file first, then rename, so a partial download
    # never appears under the real segment name
    with open('temp_backfill', 'wb') as f:
        for chunk in resp.iter_content(8192):
            f.write(chunk)
    os.rename('temp_backfill', segment)
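One way the "more general shared version" flagged above might look: a sketch that downloads to a unique temp name in the destination directory, so the rename stays atomic and concurrent backfills don't clobber each other. The helper name and error handling are illustrative, not part of this commit:

import errno
import uuid

def fetch_to_file(url, dest_path):
    # rename is atomic when source and destination are on the same
    # filesystem, so readers never see a half-written segment
    dest_dir = os.path.dirname(dest_path)
    if dest_dir:
        try:
            os.makedirs(dest_dir)
        except OSError as e:
            if e.errno != errno.EEXIST:
                raise
    temp_path = dest_path + '.tmp-' + uuid.uuid4().hex
    resp = requests.get(url, stream=True)
    resp.raise_for_status()
    with open(temp_path, 'wb') as f:
        for chunk in resp.iter_content(8192):
            f.write(chunk)
    os.rename(temp_path, dest_path)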
def back_fill(base_dir, nodes=None):
    # loop over nodes asking for a list of segments then downloads any
    # segments it doesn't have
    if nodes is None:
        nodes = get_nodes()
    for node in nodes:
        # need to figure out how to properly check whether this node is
        # the same
        if node == 'localhost':
            continue
        # not sure how much we want to hard code the search
        # replace with something from the restreamer
        # note: glob returns paths prefixed with base_dir; these need to
        # be made relative (or the remote list made absolute) before the
        # set difference below will line up
        local_segments = set(glob.glob(base_dir + '/*/*/*.ts'))
        remote_segments = set(list_remote_segments(node))
        missing_segments = remote_segments - local_segments
        for missing_segment in missing_segments:
            get_remote_segment(node, missing_segment)
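While get_nodes() is still a stub, back_fill could be exercised directly against known peers; the base_dir and addresses here are hypothetical:

# manual test only; replace with real paths and node addresses
back_fill('/var/lib/wubloader', nodes=['http://node1:8000', 'http://node2:8000'])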
def main(base_dir, wait_time=60):
    pass
    # every wait_time call back_fill
    # time from start of back_fill
    # to keep things simple don't try two back_fills at the same time
    # wait for previous one to finish before launching second.
    # if it's taken more than wait_time for back_fill to run, start
    # immediately
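A minimal sketch of the loop those comments describe: back_fill runs sequentially (so two never overlap), and the sleep only covers whatever is left of wait_time after the previous run:

import time

def main(base_dir, wait_time=60):
    while True:
        start = time.time()
        back_fill(base_dir)
        elapsed = time.time() - start
        if elapsed < wait_time:
            time.sleep(wait_time - elapsed)
        # otherwise back_fill overran wait_time; start again immediately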
