Commit 6d2cf16ad6630bf7145c0e7a2c9d6b78f0d66e67
1 parent
55041d0f
Exists in
master
and in
1 other branch
move bunch of items from test_api to prune_db
Showing
2 changed files
with
233 additions
and
219 deletions
Show diff stats
lib/tasks/prune_db.rake
... | ... | @@ -17,6 +17,223 @@ namespace :prune_db do |
17 | 17 | end |
18 | 18 | end |
19 | 19 | |
20 | + desc "Generate appearances for any votes that have no current appearance, should only need to be run once" | |
21 | + task(:generate_appearances_for_existing_votes => :environment) do | |
22 | + votes = Vote.all | |
23 | + | |
24 | + count = 0 | |
25 | + votes.each do |v| | |
26 | + if v.appearance.nil? | |
27 | + print "." | |
28 | + a = Appearance.create(:voter_id => v.voter_id, :site_id => v.site_id, :prompt_id => v.prompt_id, :question_id => v.question_id, :created_at => v.created_at, :updated_at => v.updated_at) | |
29 | + v.appearance = a | |
30 | + v.save | |
31 | + | |
32 | + count += 1 | |
33 | + end | |
34 | + end | |
35 | + | |
36 | + print count | |
37 | + end | |
38 | + | |
39 | + desc "Don't run unless you know what you are doing" | |
40 | + task(:generate_lots_of_votes => :environment) do | |
41 | + if Rails.env.production? | |
42 | + print "You probably don't want to run this in production as it will falsify a bunch of random votes" | |
43 | + end | |
44 | + | |
45 | + | |
46 | + current_user = User.first | |
47 | + 1000.times do |n| | |
48 | + puts "#{n} votes completed" if n % 100 == 0 | |
49 | + question = Question.find(214) # test question change as needed | |
50 | + @prompt = question.catchup_choose_prompt(1).first | |
51 | + @appearance = current_user.record_appearance(current_user.default_visitor, @prompt) | |
52 | + | |
53 | + direction = (rand(2) == 0) ? "left" : "right" | |
54 | + current_user.record_vote(:prompt => @prompt, :direction => direction, :appearance_lookup => @appearance.lookup) | |
55 | + end | |
56 | + | |
57 | + end | |
58 | + | |
59 | + desc "Dump votes of a question by left vs right id" | |
60 | + task(:make_csv => :environment) do | |
61 | + | |
62 | + q = Question.find(214) | |
63 | + | |
64 | + | |
65 | + the_prompts = q.prompts_hash_by_choice_ids | |
66 | + | |
67 | + #hash_of_choice_ids_from_left_to_right_to_votes | |
68 | + the_hash = {} | |
69 | + q.choices.each do |l| | |
70 | + q.choices.each do |r| | |
71 | + next if l.id == r.id | |
72 | + | |
73 | + if not the_hash.has_key?(l.id) | |
74 | + the_hash[l.id] = {} | |
75 | + the_hash[l.id][l.id] = 0 | |
76 | + end | |
77 | + | |
78 | + p = the_prompts["#{l.id}, #{r.id}"] | |
79 | + if p.nil? | |
80 | + the_hash[l.id][r.id] = 0 | |
81 | + else | |
82 | + the_hash[l.id][r.id] = p.appearances.size | |
83 | + end | |
84 | + end | |
85 | + end | |
86 | + | |
87 | + the_hash.sort.each do |xval, row| | |
88 | + rowarray = [] | |
89 | + row.sort.each do |yval, cell| | |
90 | + rowarray << cell | |
91 | + end | |
92 | + puts rowarray.join(", ") | |
93 | + end | |
94 | + end | |
95 | + | |
96 | + desc "Should only need to be run once" | |
97 | + task(:generate_all_possible_prompts => :environment) do | |
98 | + Question.find(:all).each do |q| | |
99 | + choices = q.choices | |
100 | + if q.prompts.size > choices.size**2 - choices.size | |
101 | + print "ERROR: #{q.id}\n" | |
102 | + next | |
103 | + elsif q.prompts.size == choices.size**2 - choices.size | |
104 | + print "#{q.id} has enough prompts, skipping...\n" | |
105 | + next | |
106 | + else | |
107 | + print "#{q.id} should add #{(choices.size ** 2 - choices.size) - q.prompts.size}\n" | |
108 | + | |
109 | + end | |
110 | + created_timestring = q.created_at.to_s(:db) | |
111 | + updated_timestring = Time.now.to_s(:db) #isn't rails awesome? | |
112 | + promptscount=0 | |
113 | + inserts = [] | |
114 | + the_prompts = Prompt.find(:all, :select => 'id, left_choice_id, right_choice_id', :conditions => {:question_id => q.id}) | |
115 | + | |
116 | + the_prompts_hash = {} | |
117 | + the_prompts.each do |p| | |
118 | + the_prompts_hash["#{p.left_choice_id},#{p.right_choice_id}"] = 1 | |
119 | + end | |
120 | + | |
121 | + choices.each do |l| | |
122 | + choices.each do |r| | |
123 | + if l.id == r.id | |
124 | + next | |
125 | + else | |
126 | + #p = the_prompts.find{|o| o.left_choice_id == l.id && o.right_choice_id == r.id} | |
127 | + keystring = "#{l.id},#{r.id}" | |
128 | + p = the_prompts_hash[keystring] | |
129 | + if p.nil? | |
130 | + inserts.push("(NULL, #{q.id}, NULL, #{l.id}, '#{created_timestring}', '#{updated_timestring}', NULL, 0, #{r.id}, NULL, NULL)") | |
131 | + promptscount+=1 | |
132 | + end | |
133 | + | |
134 | + end | |
135 | + | |
136 | + end | |
137 | + end | |
138 | + | |
139 | + print "Added #{promptscount} to #{q.id}\n" | |
140 | + sql = "INSERT INTO `prompts` (`algorithm_id`, `question_id`, `voter_id`, `left_choice_id`, `created_at`, `updated_at`, `tracking`, `votes_count`, `right_choice_id`, `active`, `randomkey`) VALUES #{inserts.join(', ')}" | |
141 | + unless inserts.empty? | |
142 | + ActiveRecord::Base.connection.execute(sql) | |
143 | + end | |
144 | + | |
145 | + Question.update_counters(q.id, :prompts_count => promptscount) | |
146 | + | |
147 | + | |
148 | + end | |
149 | + | |
150 | + | |
151 | + | |
152 | + end | |
153 | + | |
154 | + | |
155 | + | |
156 | + desc "Generate past density information" | |
157 | + task(:generate_past_densities => :environment) do | |
158 | + #this is not elegant, but should only be run once, so quick and dirty wins | |
159 | + | |
160 | + start_date = Vote.find(:all, :conditions => 'loser_choice_id IS NOT NULL', :order => :created_at, :limit => 1).first.created_at.to_date | |
161 | + start_date.upto(Date.today) do |the_date| | |
162 | + questions = Question.find(:all, :conditions => ['created_at < ?', the_date]) | |
163 | + | |
164 | + print the_date.to_s | |
165 | + questions.each do |q| | |
166 | + puts q.id | |
167 | + relevant_choices = q.choices.find(:all, :conditions => ['created_at < ?', the_date]) | |
168 | + | |
169 | + seed_choices = 0 | |
170 | + | |
171 | + if relevant_choices == 0 | |
172 | + next | |
173 | + #this question had not been created yet | |
174 | + end | |
175 | + | |
176 | + relevant_choices.each do |c| | |
177 | + if !c.user_created | |
178 | + seed_choices+=1 | |
179 | + end | |
180 | + | |
181 | + end | |
182 | + | |
183 | + nonseed_choices = relevant_choices.size - seed_choices | |
184 | + | |
185 | + seed_seed_total = seed_choices **2 - seed_choices | |
186 | + nonseed_nonseed_total = nonseed_choices **2 - nonseed_choices | |
187 | + seed_nonseed_total = seed_choices * nonseed_choices | |
188 | + nonseed_seed_total = seed_choices * nonseed_choices | |
189 | + | |
190 | + seed_seed_sum = 0 | |
191 | + seed_nonseed_sum= 0 | |
192 | + nonseed_seed_sum= 0 | |
193 | + nonseed_nonseed_sum= 0 | |
194 | + | |
195 | + q.appearances.find_each(:conditions => ['prompt_id IS NOT NULL AND created_at < ?', the_date]) do |a| | |
196 | + | |
197 | + p = a.prompt | |
198 | + if p.left_choice.user_created == false && p.right_choice.user_created == false | |
199 | + seed_seed_sum += 1 | |
200 | + elsif p.left_choice.user_created == false && p.right_choice.user_created == true | |
201 | + seed_nonseed_sum += 1 | |
202 | + elsif p.left_choice.user_created == true && p.right_choice.user_created == false | |
203 | + nonseed_seed_sum += 1 | |
204 | + elsif p.left_choice.user_created == true && p.right_choice.user_created == true | |
205 | + nonseed_nonseed_sum += 1 | |
206 | + end | |
207 | + end | |
208 | + | |
209 | + densities = {} | |
210 | + densities[:seed_seed] = seed_seed_sum.to_f / seed_seed_total.to_f | |
211 | + densities[:seed_nonseed] = seed_nonseed_sum.to_f / seed_nonseed_total.to_f | |
212 | + densities[:nonseed_seed] = nonseed_seed_sum.to_f / nonseed_seed_total.to_f | |
213 | + densities[:nonseed_nonseed] = nonseed_nonseed_sum.to_f / nonseed_nonseed_total.to_f | |
214 | + | |
215 | + densities.each do |type, average| | |
216 | + d = Density.new | |
217 | + d.created_at = the_date | |
218 | + d.question_id = q.id | |
219 | + d.prompt_type = type.to_s | |
220 | + d.value = average.nan? ? nil : average | |
221 | + d.save! | |
222 | + end | |
223 | + | |
224 | + puts "Seed_seed sum: #{seed_seed_sum}, seed_seed total num: #{seed_seed_total}" | |
225 | + puts "Seed_nonseed sum: #{seed_nonseed_sum}, seed_nonseed total num: #{seed_nonseed_total}" | |
226 | + puts "Nonseed_seed sum: #{nonseed_seed_sum}, nonseed_seed total num: #{nonseed_seed_total}" | |
227 | + puts "Nonseed_nonseed sum: #{nonseed_nonseed_sum}, nonseed_nonseed total num: #{nonseed_nonseed_total}" | |
228 | + | |
229 | + | |
230 | + end | |
231 | + | |
232 | + end | |
233 | + | |
234 | + end | |
235 | + | |
236 | + | |
20 | 237 | desc "Invalidates votes with bad response times" |
21 | 238 | task :invalidate_votes_with_bad_response_times => :environment do |
22 | 239 | badvotes = [] | ... | ... |
lib/tasks/test_api.rake
... | ... | @@ -68,223 +68,6 @@ namespace :test_api do |
68 | 68 | return error_message.blank? ? [success_message, false] : [error_message, true] |
69 | 69 | end |
70 | 70 | |
71 | - desc "Don't run unless you know what you are doing" | |
72 | - task(:generate_lots_of_votes => :environment) do | |
73 | - if Rails.env.production? | |
74 | - print "You probably don't want to run this in production as it will falsify a bunch of random votes" | |
75 | - end | |
76 | - | |
77 | - | |
78 | - current_user = User.first | |
79 | - 1000.times do |n| | |
80 | - puts "#{n} votes completed" if n % 100 == 0 | |
81 | - question = Question.find(214) # test question change as needed | |
82 | - @prompt = question.catchup_choose_prompt(1).first | |
83 | - @appearance = current_user.record_appearance(current_user.default_visitor, @prompt) | |
84 | - | |
85 | - direction = (rand(2) == 0) ? "left" : "right" | |
86 | - current_user.record_vote(:prompt => @prompt, :direction => direction, :appearance_lookup => @appearance.lookup) | |
87 | - end | |
88 | - | |
89 | - end | |
90 | - | |
91 | - desc "Generate appearances for any votes that have no current appearance, should only need to be run once" | |
92 | - task(:generate_appearances_for_existing_votes => :environment) do | |
93 | - votes = Vote.all | |
94 | - | |
95 | - count = 0 | |
96 | - votes.each do |v| | |
97 | - if v.appearance.nil? | |
98 | - print "." | |
99 | - a = Appearance.create(:voter_id => v.voter_id, :site_id => v.site_id, :prompt_id => v.prompt_id, :question_id => v.question_id, :created_at => v.created_at, :updated_at => v.updated_at) | |
100 | - v.appearance = a | |
101 | - v.save | |
102 | - | |
103 | - count += 1 | |
104 | - end | |
105 | - end | |
106 | - | |
107 | - print count | |
108 | - end | |
109 | - | |
110 | - | |
111 | - desc "Generate past density information" | |
112 | - task(:generate_past_densities => :environment) do | |
113 | - #this is not elegant, but should only be run once, so quick and dirty wins | |
114 | - | |
115 | - start_date = Vote.find(:all, :conditions => 'loser_choice_id IS NOT NULL', :order => :created_at, :limit => 1).first.created_at.to_date | |
116 | - start_date.upto(Date.today) do |the_date| | |
117 | - questions = Question.find(:all, :conditions => ['created_at < ?', the_date]) | |
118 | - | |
119 | - print the_date.to_s | |
120 | - questions.each do |q| | |
121 | - puts q.id | |
122 | - relevant_choices = q.choices.find(:all, :conditions => ['created_at < ?', the_date]) | |
123 | - | |
124 | - seed_choices = 0 | |
125 | - | |
126 | - if relevant_choices == 0 | |
127 | - next | |
128 | - #this question had not been created yet | |
129 | - end | |
130 | - | |
131 | - relevant_choices.each do |c| | |
132 | - if !c.user_created | |
133 | - seed_choices+=1 | |
134 | - end | |
135 | - | |
136 | - end | |
137 | - | |
138 | - nonseed_choices = relevant_choices.size - seed_choices | |
139 | - | |
140 | - seed_seed_total = seed_choices **2 - seed_choices | |
141 | - nonseed_nonseed_total = nonseed_choices **2 - nonseed_choices | |
142 | - seed_nonseed_total = seed_choices * nonseed_choices | |
143 | - nonseed_seed_total = seed_choices * nonseed_choices | |
144 | - | |
145 | - seed_seed_sum = 0 | |
146 | - seed_nonseed_sum= 0 | |
147 | - nonseed_seed_sum= 0 | |
148 | - nonseed_nonseed_sum= 0 | |
149 | - | |
150 | - q.appearances.find_each(:conditions => ['prompt_id IS NOT NULL AND created_at < ?', the_date]) do |a| | |
151 | - | |
152 | - p = a.prompt | |
153 | - if p.left_choice.user_created == false && p.right_choice.user_created == false | |
154 | - seed_seed_sum += 1 | |
155 | - elsif p.left_choice.user_created == false && p.right_choice.user_created == true | |
156 | - seed_nonseed_sum += 1 | |
157 | - elsif p.left_choice.user_created == true && p.right_choice.user_created == false | |
158 | - nonseed_seed_sum += 1 | |
159 | - elsif p.left_choice.user_created == true && p.right_choice.user_created == true | |
160 | - nonseed_nonseed_sum += 1 | |
161 | - end | |
162 | - end | |
163 | - | |
164 | - densities = {} | |
165 | - densities[:seed_seed] = seed_seed_sum.to_f / seed_seed_total.to_f | |
166 | - densities[:seed_nonseed] = seed_nonseed_sum.to_f / seed_nonseed_total.to_f | |
167 | - densities[:nonseed_seed] = nonseed_seed_sum.to_f / nonseed_seed_total.to_f | |
168 | - densities[:nonseed_nonseed] = nonseed_nonseed_sum.to_f / nonseed_nonseed_total.to_f | |
169 | - | |
170 | - densities.each do |type, average| | |
171 | - d = Density.new | |
172 | - d.created_at = the_date | |
173 | - d.question_id = q.id | |
174 | - d.prompt_type = type.to_s | |
175 | - d.value = average.nan? ? nil : average | |
176 | - d.save! | |
177 | - end | |
178 | - | |
179 | - puts "Seed_seed sum: #{seed_seed_sum}, seed_seed total num: #{seed_seed_total}" | |
180 | - puts "Seed_nonseed sum: #{seed_nonseed_sum}, seed_nonseed total num: #{seed_nonseed_total}" | |
181 | - puts "Nonseed_seed sum: #{nonseed_seed_sum}, nonseed_seed total num: #{nonseed_seed_total}" | |
182 | - puts "Nonseed_nonseed sum: #{nonseed_nonseed_sum}, nonseed_nonseed total num: #{nonseed_nonseed_total}" | |
183 | - | |
184 | - | |
185 | - end | |
186 | - | |
187 | - end | |
188 | - | |
189 | - end | |
190 | - | |
191 | - | |
192 | - desc "Should only need to be run once" | |
193 | - task(:generate_all_possible_prompts => :environment) do | |
194 | - Question.find(:all).each do |q| | |
195 | - choices = q.choices | |
196 | - if q.prompts.size > choices.size**2 - choices.size | |
197 | - print "ERROR: #{q.id}\n" | |
198 | - next | |
199 | - elsif q.prompts.size == choices.size**2 - choices.size | |
200 | - print "#{q.id} has enough prompts, skipping...\n" | |
201 | - next | |
202 | - else | |
203 | - print "#{q.id} should add #{(choices.size ** 2 - choices.size) - q.prompts.size}\n" | |
204 | - | |
205 | - end | |
206 | - created_timestring = q.created_at.to_s(:db) | |
207 | - updated_timestring = Time.now.to_s(:db) #isn't rails awesome? | |
208 | - promptscount=0 | |
209 | - inserts = [] | |
210 | - the_prompts = Prompt.find(:all, :select => 'id, left_choice_id, right_choice_id', :conditions => {:question_id => q.id}) | |
211 | - | |
212 | - the_prompts_hash = {} | |
213 | - the_prompts.each do |p| | |
214 | - the_prompts_hash["#{p.left_choice_id},#{p.right_choice_id}"] = 1 | |
215 | - end | |
216 | - | |
217 | - choices.each do |l| | |
218 | - choices.each do |r| | |
219 | - if l.id == r.id | |
220 | - next | |
221 | - else | |
222 | - #p = the_prompts.find{|o| o.left_choice_id == l.id && o.right_choice_id == r.id} | |
223 | - keystring = "#{l.id},#{r.id}" | |
224 | - p = the_prompts_hash[keystring] | |
225 | - if p.nil? | |
226 | - inserts.push("(NULL, #{q.id}, NULL, #{l.id}, '#{created_timestring}', '#{updated_timestring}', NULL, 0, #{r.id}, NULL, NULL)") | |
227 | - promptscount+=1 | |
228 | - end | |
229 | - | |
230 | - end | |
231 | - | |
232 | - end | |
233 | - end | |
234 | - | |
235 | - print "Added #{promptscount} to #{q.id}\n" | |
236 | - sql = "INSERT INTO `prompts` (`algorithm_id`, `question_id`, `voter_id`, `left_choice_id`, `created_at`, `updated_at`, `tracking`, `votes_count`, `right_choice_id`, `active`, `randomkey`) VALUES #{inserts.join(', ')}" | |
237 | - unless inserts.empty? | |
238 | - ActiveRecord::Base.connection.execute(sql) | |
239 | - end | |
240 | - | |
241 | - Question.update_counters(q.id, :prompts_count => promptscount) | |
242 | - | |
243 | - | |
244 | - end | |
245 | - | |
246 | - | |
247 | - | |
248 | - end | |
249 | - | |
250 | - | |
251 | - desc "Dump votes of a question by left vs right id" | |
252 | - task(:make_csv => :environment) do | |
253 | - | |
254 | - q = Question.find(214) | |
255 | - | |
256 | - | |
257 | - the_prompts = q.prompts_hash_by_choice_ids | |
258 | - | |
259 | - #hash_of_choice_ids_from_left_to_right_to_votes | |
260 | - the_hash = {} | |
261 | - q.choices.each do |l| | |
262 | - q.choices.each do |r| | |
263 | - next if l.id == r.id | |
264 | - | |
265 | - if not the_hash.has_key?(l.id) | |
266 | - the_hash[l.id] = {} | |
267 | - the_hash[l.id][l.id] = 0 | |
268 | - end | |
269 | - | |
270 | - p = the_prompts["#{l.id}, #{r.id}"] | |
271 | - if p.nil? | |
272 | - the_hash[l.id][r.id] = 0 | |
273 | - else | |
274 | - the_hash[l.id][r.id] = p.appearances.size | |
275 | - end | |
276 | - end | |
277 | - end | |
278 | - | |
279 | - the_hash.sort.each do |xval, row| | |
280 | - rowarray = [] | |
281 | - row.sort.each do |yval, cell| | |
282 | - rowarray << cell | |
283 | - end | |
284 | - puts rowarray.join(", ") | |
285 | - end | |
286 | - end | |
287 | - | |
288 | 71 | |
289 | 72 | desc "Generate density information for each question - should be run nightly" |
290 | 73 | task(:generate_density_information => :environment) do |
... | ... | @@ -663,8 +446,11 @@ namespace :test_api do |
663 | 446 | |
664 | 447 | desc "Ensure that a question has: answered_appearances == votes + skips" |
665 | 448 | task :answered_appearances_equals_votes_and_skips, [:question_id] => :environment do |t, args| |
666 | - question = Question.find(args[:question_id]) | |
667 | - puts answered_appearances_equals_votes_and_skips(question).inspect | |
449 | + a = cleanup_args(args) | |
450 | + questions = Question.find(a[:question_id]) | |
451 | + questions.each do |question| | |
452 | + puts answered_appearances_equals_votes_and_skips(question).inspect | |
453 | + end | |
668 | 454 | end |
669 | 455 | |
670 | 456 | def answered_appearances_equals_votes_and_skips(question) |
... | ... | @@ -726,3 +512,14 @@ namespace :test_api do |
726 | 512 | end |
727 | 513 | end |
728 | 514 | |
515 | +def cleanup_args(args) | |
516 | + args.with_defaults(:question_id => :all, :choice_id => :all) | |
517 | + a = args.to_hash | |
518 | + if a[:question_id] != :all | |
519 | + a[:question_id] = a[:question_id].split(".") | |
520 | + end | |
521 | + if a[:choice_id] != :all | |
522 | + a[:choice_id] = a[:choice_id].split(".") | |
523 | + end | |
524 | + a | |
525 | +end | ... | ... |