# change_bot.rb
# Forked from zerebubuth/openstreetmap-license-change.
require 'rubygems'
require './osm'
require './db'
require './actions'
require './tags'
require 'set'
# Replays the version history of a single element (node, way or relation)
# one version at a time and, from what was recorded during the replay,
# derives the Edit / Delete / Redact actions for that element (see #actions).
#
# State kept while replaying:
#   @cleans       - one boolean per merged version
#   @acceptors    - a second boolean per merged version, parallel to @cleans
#                   (true from the merge_clean_* methods, false when
#                   #merge_dirty records a significant dirty change);
#                   #actions uses it to choose :visible or :hidden redaction
#   @clean_values - tag hash built up from the versions merged as clean
#   @tainted_tags - tags introduced or significantly changed by dirty versions
#   @clean_geom   - for nodes, a geom value; for ways and relations, a list
#                   of [node_or_member, clean_flag] pairs
class History
# versions: the versions of one element, in the order they should be
# replayed. The starting geometry is taken from the first version's
# version_zero_geom (defined outside this file).
# NOTE(review): if `versions` is an empty Array, `first` is nil and this
# raises NoMethodError - confirm callers never pass an empty history.
def initialize(versions)
# TODO: ensure sort (nothing here sorts or validates the order of `versions`)
@versions = versions
@tainted_tags = Hash.new
@clean_values = Hash.new
@cleans = Array.new
@acceptors = Array.new
@clean_geom = @versions.first.version_zero_geom
end
# Yields each version, in stored order, to the given block.
def each_version
@versions.each do |v|
yield v
end
end
# Records `obj` as a fully clean version on top of a history that is clean
# so far: its tags become the clean tag set and its geometry becomes the
# clean geometry (every way node / relation member flagged true).
# NOTE(review): @clean_values is set to the very same Hash object as
# obj.tags, not a copy; later in-place changes to @clean_values (merge!,
# delete, delete_if) would therefore also change that version's tags unless
# obj.tags returns a fresh hash - confirm against the OSM classes.
def merge_clean_onto_clean(obj)
@cleans << true
@acceptors << true
@clean_values = obj.tags
case obj
when OSM::Node
@clean_geom = obj.geom
when OSM::Way
@clean_geom = obj.nodes.map {|n| [n, true]}
when OSM::Relation
@clean_geom = obj.members.map {|m| [m, true]}
end
end
# Records `obj` as an acceptable version on top of a history that already
# contains something dirty. The version only counts as fully clean if none
# of its tags had to be held back and (for ways and relations) every entry
# of the resulting geometry is flagged clean.
def merge_clean_onto_dirty(obj)
# merge any value changes for non-tainted keys into the
# tag set.
is_fully_clean = true
clean_tags = obj.tags.select do |k, v|
# a tag is held back when its key is tainted and Tags.significant_tag?
# reports no significant difference between the tainted value and this one
any_tainted = @tainted_tags.has_key?(k) && !Tags.significant_tag?(@tainted_tags[k], v)
if any_tainted
is_fully_clean = false
end
not any_tainted
end
# figure out what needs to happen with the geometry
case obj
when OSM::Node
# ??? need to account for node movage?
@clean_geom = obj.geom
when OSM::Way
# split the [node, flag] pairs into two parallel lists; every node of the
# current version starts out flagged clean.
old_nds, old_clean = @clean_geom.empty? ? [[],[]] : @clean_geom.transpose
cur_nds, cur_clean = obj.nodes, obj.nodes.map { true }
# Util.diff_split is defined elsewhere. NOTE(review): from its use here it
# must return one flag per entry of cur_nds (the transpose below needs
# equal lengths); presumably it carries old flags over to unchanged
# entries - confirm.
new_clean = Util.diff_split(old_nds, old_clean, cur_nds, cur_clean)
@clean_geom = [cur_nds, new_clean].transpose
# check the clean-ness. if the new nodes are all clean, then this version
# may also be fully clean.
is_fully_clean = is_fully_clean && @clean_geom.all? {|n,c| c}
when OSM::Relation
# same procedure as for ways, applied to the member list.
old_mem, old_clean = @clean_geom.empty? ? [[],[]] : @clean_geom.transpose
cur_mem, cur_clean = obj.members, obj.members.map { true }
new_clean = Util.diff_split(old_mem, old_clean, cur_mem, cur_clean)
@clean_geom = [cur_mem, new_clean].transpose
is_fully_clean = is_fully_clean && @clean_geom.all? {|m,c| c}
end
@cleans << is_fully_clean
@acceptors << true
@clean_values.merge!(clean_tags)
end
# Records a version that did not come from an accepted changeset. If it
# changes tags significantly (per Tags.significant?) or changes geometry,
# it is recorded as dirty and its new/changed tags become tainted;
# otherwise it is handed to one of the merge_clean_* methods.
def merge_dirty(obj)
# compare the object's geometry with the clean geometry; for ways and
# relations only the items (not the clean flags) are compared. If `obj` is
# none of the three classes the case yields nil.
geom_is_diff = case obj
when OSM::Node
@clean_geom != obj.geom
when OSM::Way
(@clean_geom.map {|n,c| n}) != obj.geom
when OSM::Relation
(@clean_geom.map {|m,c| m}) != obj.geom
end
if Tags.significant?(@clean_values, obj.tags) or geom_is_diff
@cleans << false
@acceptors << false
# tags which were created in this version of the object are
# now tainted :-(
@tainted_tags.merge!(obj.tags.select {|k,v| not @clean_values.has_key?(k)})
# tags which were modified from the previous clean version
# are also tainted as long as the change is significant :'(
keys_in_both = obj.tags.keys & @clean_values.keys
changed_keys = keys_in_both.select {|k| Tags.significant_tag?(@clean_values[k], obj.tags[k])}
@tainted_tags.merge!(obj.tags.select {|k,v| changed_keys.include? k})
# tags removed in the dirty version can be kept as deleted
# though.
(@clean_values.keys - obj.tags.keys).each {|k| @clean_values.delete(k)}
case obj
when OSM::Node
# can't use dirty geometry
when OSM::Way
# a changed node list is recorded with every current node initially
# flagged false before being passed through Util.diff_split.
if (@clean_geom.map {|n,c| n}) != obj.geom
old_nds, old_clean = @clean_geom.empty? ? [[],[]] : @clean_geom.transpose
cur_nds, cur_clean = obj.nodes, obj.nodes.map { false }
new_clean = Util.diff_split(old_nds, old_clean, cur_nds, cur_clean)
@clean_geom = [cur_nds, new_clean].transpose
end
when OSM::Relation
# same as the way case, applied to the member list.
if (@clean_geom.map {|m,c| m}) != obj.geom
old_mem, old_clean = @clean_geom.empty? ? [[],[]] : @clean_geom.transpose
cur_mem, cur_clean = obj.members, obj.members.map { false }
new_clean = Util.diff_split(old_mem, old_clean, cur_mem, cur_clean)
@clean_geom = [cur_mem, new_clean].transpose
end
end
else
# if we get here then the tag changes weren't significant and
# the geometry was the same.
if is_clean?
merge_clean_onto_clean(obj)
else
merge_clean_onto_dirty(obj)
end
end
end
# True when every flag recorded so far in @cleans is truthy (which includes
# the case where nothing has been recorded yet).
def is_clean?
@cleans.all?
end
# Builds the list of actions for the replayed history. Versions are paired
# with @cleans and @acceptors by position, so every version is expected to
# have been merged before this is called.
#
# Returns an Array of Redact actions, preceded by a single Edit or Delete
# when one is needed. Note that this method modifies @clean_values (tainted
# keys are removed in the :clean branch below).
def actions
# the Edit/Delete that ends up at the front of the result, if any
first_act = nil
# the Redact actions, in version order
acts = Array.new
# running state: true while everything up to the current version is
# considered clean (or has been reset to clean)
clean_flag = true
prev_obj = nil
max_version = nil
# value of clean_flag recorded for each version, used for revert detection
clean_history = Array.new
# versions that were redacted although flagged clean; their Redact
# actions may be dropped again at the end
unredacts_later = Array.new
@versions.zip(@cleans).zip(@acceptors).map {|i| i.flatten}.each do |obj,clean,acceptor|
clean_flag = clean_flag && clean
# deleted objects are always clean
unless obj.visible
clean_flag = true
first_act = nil
end
clean_history << clean_flag
unless clean_flag
# `done` is set once this version has been dealt with, so that the
# fallback redaction at the bottom is skipped
done = false
odbl_clean = Tags.odbl_clean?(obj.tags)
if (clean or acceptor) and
((prev_obj.nil? or obj.geom != prev_obj.geom) or
(odbl_clean))
# decide between :untagged (nothing to do for this version) and :clean
# (emit an Edit built from a copy of the object plus a Redact)
case obj
when OSM::Node
if obj.tags.empty? or odbl_clean
act = :untagged
else
act = :clean
new_obj = obj.clone
end
when OSM::Way
if odbl_clean or ((obj.tags == @clean_values) && ((@clean_geom.select {|n,c| c}.map {|n,c| n}) == obj.nodes))
act = :untagged
else
act = :clean
new_obj = obj.clone
# keep only the nodes flagged clean
new_obj.nodes = @clean_geom.select {|n,c| c}.map {|n,c| n}
end
when OSM::Relation
if odbl_clean or ((obj.tags == @clean_values) && ((@clean_geom.select {|m,c| c}.map {|m,c| m}) == obj.members))
act = :untagged
else
act = :clean
new_obj = obj.clone
# keep only the members flagged clean
new_obj.members = @clean_geom.select {|m,c| c}.map {|m,c| m}
end
end
if act == :untagged
first_act = nil
clean_flag = true
done = true
elsif act == :clean
# strip tainted keys from the clean tag set (this mutates the instance
# state) and use the result as the tags of the edited object
@clean_values.delete_if {|k,v| @tainted_tags.has_key? k}
new_obj.tags = @clean_values
first_act = Edit[new_obj]
acts << Redact[obj.class, obj.element_id, obj.version, acceptor ? :visible : :hidden]
unredacts_later << obj.version if clean
clean_flag = true
done = true
end
end
if clean and not clean_flag
# if it exactly matches a previous clean version then it's
# a revert and is clean.
reverts = @versions.zip(clean_history).select {|hobj, ch| (obj.tags == hobj.tags) and (obj.geom == hobj.geom) and ch}
unless reverts.empty?
clean_flag = true
first_act = nil
done = true
end
end
if not done
# fallback: redact this version; if no leading action exists yet, either
# delete the element (no previous version) or edit back to the previous
# version
if first_act.nil?
if prev_obj.nil?
first_act = Delete[obj.class, obj.element_id]
else
first_act = Edit[prev_obj]
end
end
acts << Redact[obj.class, obj.element_id, obj.version, acceptor ? :visible : :hidden]
end
end
prev_obj = obj
max_version = obj.version
end
# need to adjust any edit actions to represent changes from
# the last version of the object we've seen.
if (not first_act.nil?) and (first_act.class == Edit)
# drop the redactions noted in unredacts_later, except one for the last
# version seen
acts.delete_if {|o| (o.version != max_version) and unredacts_later.include?(o.version) }
# NOTE(review): this reassignment is never read afterwards
unredacts_later = Array.new
# NOTE(review): `clone` copies the Edit but, unless Edit overrides
# copying, first_act.obj is still the same object as before (possibly an
# element of @versions), so the assignments below modify it in place -
# confirm that is intended.
first_act = first_act.clone
first_act.obj.changeset_id = -1
first_act.obj.version = max_version
first_act.obj.tags = @clean_values
end
first_act.nil? ? acts : [first_act] + acts
end
end
# Drives the per-element processing: for each element it fetches the history
# from the database object, asks History for the resulting actions, and
# collects them into pending edits, pending deletes and redactions. The
# pending edits and deletes can then be turned into one ordered changeset
# with #as_changeset.
class ChangeBot
  # Redact actions collected by #process!, in the order they were produced.
  attr_reader :redactions

  # db: the data source. This class calls exclude?, node, way, relation,
  # nodes, ways, relations, objects_using and changeset on it.
  def initialize(db)
    @db = db
    # both hashes are keyed by [klass, element_id]
    @pending_deletes = {}
    @pending_edits = {}
    @redactions = []
  end

  # Returns the list of actions for one element.
  #
  # history: the versions of a single element; the class and element id are
  # read from the first entry.
  def action_for(history)
    # special case for excluded items: delete the element and hide every
    # version of it.
    klass = history.first.class
    element_id = history.first.element_id
    if @db.exclude?(klass, element_id)
      return [Delete[klass, element_id]] +
             history.map { |e| Redact[klass, element_id, e.version, :hidden] }
    end

    # otherwise, normal process: replay every version into a History,
    # choosing the merge method by whether the version's changeset is
    # accepted and whether the history is still clean.
    h = History.new(history)
    h.each_version do |element|
      if changeset_is_accepted?(element.changeset_id)
        if h.is_clean?
          h.merge_clean_onto_clean(element)
        else
          h.merge_clean_onto_dirty(element)
        end
      else
        h.merge_dirty(element)
      end
    end
    h.actions
  end

  # Processes a single element and files the resulting actions.
  #
  # klass:  OSM::Node, OSM::Way or OSM::Relation (for any other value no
  #         history is fetched and #action_for will fail on nil)
  # elt_id: id of the element
  def process!(klass, elt_id)
    # grab history from the database
    history = if klass == OSM::Node
                @db.node(elt_id)
              elsif klass == OSM::Way
                @db.way(elt_id)
              elsif klass == OSM::Relation
                @db.relation(elt_id)
              end

    # get the actions for it
    actions = action_for(history)

    # split up the actions into edits, deletes and redactions. a later edit
    # or delete for the same element replaces an earlier one.
    key = [klass, elt_id]
    actions.each do |act|
      case act
      when Edit
        @pending_edits[key] = act
      when Delete
        @pending_deletes[key] = act
      when Redact
        @redactions << act
      end
    end
  end

  # Processes every node, then every way, then every relation known to the
  # database object.
  def process_all!
    @db.nodes.keys.each { |n| process!(OSM::Node, n) }
    @db.ways.keys.each { |w| process!(OSM::Way, w) }
    @db.relations.keys.each { |r| process!(OSM::Relation, r) }
  end

  # Returns the pending edits and deletes as one Array, ordered so that
  # references are removed before the referenced objects are deleted:
  # all edits first, then all deletes, each group ordered relations, ways,
  # nodes.
  def as_changeset
    changeset = []

    # go over the pending deletes. each of these may affect other objects
    # which aren't even in the set of objects that we wanted to process.
    # in that case, we'll need to create a new edit on that other object
    # to remove the current object from it first.
    #
    # in order to get this right we need to process the node deletions
    # first, then the way deletions, then the relation deletions. the
    # reason for this is that a node deletion can affect ways and
    # relations, causing them to also be deleted. ways deletions, in turn,
    # can cascade to relation deletions but, importantly, not to node
    # deletions.
    #
    [OSM::Node, OSM::Way, OSM::Relation].each do |klass|
      # take a snapshot of the ids first: process_delete may add new entries
      # to @pending_deletes, which is not allowed while iterating the hash.
      ids = @pending_deletes.keys.select { |id| id[0] == klass }
      ids.each { |id| process_delete(id, @pending_deletes[id]) }
    end

    # we should now be OK to do the edits, removing references to
    # deleted objects.
    [OSM::Relation, OSM::Way, OSM::Node].each do |klass|
      @pending_edits.each do |id, edit|
        changeset << edit if id[0] == klass
      end
    end

    # having removed references, we should be OK to do the deletes
    [OSM::Relation, OSM::Way, OSM::Node].each do |klass|
      @pending_deletes.each do |id, del|
        changeset << del if id[0] == klass
      end
    end

    changeset
  end

  # Removes the object identified by `id` from everything that references
  # it, creating or updating pending edits as needed. A way left with fewer
  # than two nodes, or a relation left without members, is turned into a
  # pending delete instead.
  #
  # id:  [klass, element_id] of the object being deleted
  # del: the pending Delete for that object (not used here)
  #
  # Raises Exception if a node is reported as referencing the object.
  def process_delete(id, del)
    references = @db.objects_using(*id)
    references.each do |ref_obj|
      ref_id = [ref_obj.class, ref_obj.element_id]

      # if we're planning to delete this item anyway, then just leave
      # it - no need to alter that edit.
      next if @pending_deletes.has_key? ref_id

      # get the edit we're planning to do, if there is one, otherwise
      # the current object version.
      # NOTE(review): `clone` is shallow unless the OSM classes override
      # copying, so the in-place removal below may also change ref_obj's own
      # node/member list - confirm.
      edit = if @pending_edits.has_key?(ref_id)
               @pending_edits[ref_id]
             else
               obj = ref_obj.clone
               obj.changeset_id = -1
               Edit[obj]
             end

      kill_object = false
      case edit.obj
      when OSM::Node
        raise Exception.new("Node found as referencing object. BUG!")
      when OSM::Way
        edit.obj.nodes.reject! { |n| n == id[1] }
        kill_object = edit.obj.nodes.size < 2
      when OSM::Relation
        edit.obj.members.reject! { |m| m.type == id[0] && m.ref == id[1] }
        kill_object = edit.obj.members.empty?
      end

      if kill_object
        @pending_edits.delete ref_id
        @pending_deletes[ref_id] = Delete[*ref_id]
      else
        @pending_edits[ref_id] = edit
      end
    end
  end

  # Whether the given changeset counts as accepted: its user accepted, or
  # the user has an adopter who accepted, or the changeset carries an
  # override.
  #
  # `||=` is used deliberately: the earlier form `accepted = accepted or x`
  # parses as `(accepted = accepted) or x`, which silently discarded the
  # adopter and override checks.
  def changeset_is_accepted?(changeset_id)
    cs = @db.changeset(changeset_id)
    accepted = cs.user.accepted_cts?
    accepted ||= !cs.user.adopter.nil? && cs.user.adopter.accepted_cts?
    accepted ||= cs.override_accepted?
    accepted
  end
end