source: trunk/misc/coding_tools/make-canary-files.py

Last change on this file was 4ac60c5, checked in by Alexandre Detiste <alexandre.detiste@…>, at 2024-12-21T13:57:09Z

vendor cmp()

  • Property mode set to 100644
File size: 5.3 KB
Line 
#!/usr/bin/env python


"""
Given a list of nodeids and a 'convergence' file, create a bunch of files
that will (when encoded at k=1,N=1) be uploaded to specific nodeids.

Run this as follows:

 make-canary-files.py -c PATH/TO/convergence -n PATH/TO/nodeids -k 1 -N 1

It will create a directory named 'canaries', with one file per nodeid named
'$NODEID-$NICKNAME.txt', that contains some random text.

The 'nodeids' file should contain one base32 nodeid per line, followed by the
optional nickname, like:

---
5yyqu2hbvbh3rgtsgxrmmg4g77b6p3yo  server12
vb7vm2mneyid5jbyvcbk2wb5icdhwtun  server13
...
---

The resulting 'canaries/5yyqu2hbvbh3rgtsgxrmmg4g77b6p3yo-server12.txt' file
will, when uploaded with the given (convergence,k,N) pair, have its first
share placed on the 5yyq/server12 storage server. If N>1, the other shares
will be placed elsewhere, of course.

This tool can be useful to construct a set of 'canary' files, which can then
be uploaded to storage servers, and later downloaded to test a grid's health.
If you are able to download the canary for server12 via some tahoe node X,
then the following properties are known to be true:

 node X is running, and has established a connection to server12
 server12 is running, and returning data for at least the given file

Using k=1/N=1 creates a separate test for each server. The test process is
then to download the whole directory of files (perhaps with a t=deep-check
operation).

Alternatively, you could upload with the usual k=3/N=10 and then move/delete
shares to put all N shares on a single server.

Note that any changes to the nodeid list will affect the placement of shares.
Shares should be uploaded with the same nodeid list as this tool used when
constructing the files.

Also note that this tool uses the Tahoe codebase, so it should be run on a
system where Tahoe is installed, or in a source tree with setup.py like this:

 setup.py run_with_pythonpath -p -c 'misc/make-canary-files.py ARGS..'
"""
53
54import os, hashlib
55from twisted.python import usage
56from allmydata.immutable import upload
57from allmydata.util import base32
58
def cmp(a, b):
    """Three-way comparison, vendored from the Python 2 builtin.

    Returns -1 if a < b, 1 if a > b, and 0 when they are equal.
    """
    if a < b:
        return -1
    if a > b:
        return 1
    return 0
61
class Options(usage.Options):
    """Command-line interface for the canary-file generator.

    Declarative twisted.python.usage option tables: parameters take a
    value (k and N are coerced to int), flags are booleans.
    """

    optParameters = [
        ("convergence", "c", None, "path to NODEDIR/private/convergence"),
        ("nodeids", "n", None, "path to file with one base32 nodeid per line"),
        ("k", "k", 1, "number of necessary shares, defaults to 1", int),
        ("N", "N", 1, "number of total shares, defaults to 1", int),
    ]

    optFlags = [
        ("verbose", "v", "Be noisy"),
    ]
72
# Parse command-line arguments; parseOptions() prints usage and exits
# on bad input.
opts = Options()
opts.parseOptions()

verbose = bool(opts["verbose"])

# Map binary nodeid -> nickname (None when the line carried no nickname).
# Blank lines and '#' comments in the nodeids file are skipped.  Use a
# context manager so the file handle is closed promptly instead of leaked.
nodes = {}
with open(opts["nodeids"], "r") as nodeids_file:
    for line in nodeids_file:
        line = line.strip()
        if not line or line.startswith("#"):
            continue
        pieces = line.split(None, 1)
        if len(pieces) == 2:
            nodeid_s, nickname = pieces
        else:
            nodeid_s = pieces[0]
            nickname = None
        nodes[base32.a2b(nodeid_s)] = nickname
91
# The placement predicted by this tool only matches a real upload if the
# uploading client uses the same encoding parameters; warn when k/N differ
# from the values this check expects.
if opts["k"] != 3 or opts["N"] != 10:
    print("note: using non-default k/N requires patching the Tahoe code")
    print("src/allmydata/client.py line 55, DEFAULT_ENCODING_PARAMETERS")

# Read the convergence secret (stored base32-encoded); close the file
# handle promptly instead of leaking it.
convergence_file = os.path.expanduser(opts["convergence"])
with open(convergence_file, "rb") as conv_f:
    convergence_s = conv_f.read().strip()
convergence = base32.a2b(convergence_s)
99
def get_permuted_peers(key):
    """Return the nodeids from ``nodes`` in permuted-peer order for *key*.

    Each nodeid is ranked by sha1(key + nodeid); the list of nodeids is
    returned sorted by that digest, mirroring Tahoe's server-selection
    permutation.
    """
    # BUG FIX: Python 3's list.sort() no longer accepts a positional cmp
    # function, so the old `results.sort(lambda a, b: cmp(a[0], b[0]))`
    # raised TypeError.  Rank with key= instead; ties (identical digests)
    # keep their original order because sort() is stable, same as before.
    ranked = [(hashlib.sha1(key + nodeid).digest(), nodeid)
              for nodeid in nodes]
    ranked.sort(key=lambda pair: pair[0])
    return [nodeid for _digest, nodeid in ranked]
107
def find_share_for_target(target):
    """Brute-force file contents whose first share lands on *target*.

    Repeatedly generates candidate contents with a random suffix, computes
    the storage index each would get under the global ``convergence``
    secret, and checks whether *target* is first in the permuted peer
    list.  The winning contents are written to
    canaries/$NODEID[-$NICKNAME].txt.  Returns the number of candidate
    suffixes tried.
    """
    target_s = base32.b2a(target)
    # NOTE(review): this concatenation assumes base32.b2a returns str; if
    # it returns bytes on py3 a .decode() is needed here -- confirm.
    prefix = "The first share of this file will be placed on " + target_s + "\n"
    prefix += "This data is random: "
    attempts = 0
    while True:
        attempts += 1
        suffix = base32.b2a(os.urandom(10))
        if verbose: print(" trying", suffix, end=' ')
        data = prefix + suffix + "\n"
        assert len(data) > 55  # no LIT files
        # now, what storage index will this get?
        u = upload.Data(data, convergence)
        eu = upload.EncryptAnUploadable(u)
        d = eu.get_storage_index() # this happens to run synchronously
        def _got_si(si, data=data):
            if verbose: print("SI", base32.b2a(si), end=' ')
            peerlist = get_permuted_peers(si)
            if peerlist[0] != target:
                # a different server would get share 0; try another suffix
                if verbose: print("  boo")
                return False
            if verbose: print("  yay!")
            fn = base32.b2a(target)
            if nodes[target]:
                # nicknames may contain '/', which is not filename-safe
                nickname = nodes[target].replace("/", "_")
                fn += "-" + nickname
            fn += ".txt"
            fn = os.path.join("canaries", fn)
            # close the handle promptly instead of leaking it
            with open(fn, "w") as out:
                out.write(data)
            return True
        d.addCallback(_got_si)
        # get sneaky and look inside the Deferred for the synchronous result
        if d.result:
            return attempts
144
# Generate one canary file per configured server and report how much
# brute-forcing was needed.  mkdir (not makedirs) deliberately fails if
# 'canaries' already exists, so stale canaries are never silently mixed in.
os.mkdir("canaries")
attempts = []
for target in nodes:
    print("working on", base32.b2a(target))
    attempts.append(find_share_for_target(target))
print("done")
# Guard the summary: with an empty nodeids file, max() raises ValueError
# and the average divides by zero.
if attempts:
    print("%d attempts total, avg %d per target, max %d" %
          (sum(attempts), 1.0 * sum(attempts) / len(nodes), max(attempts)))
else:
    print("no nodeids found; nothing to do")
154
155
Note: See TracBrowser for help on using the repository browser.